diff --git "a/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" "b/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" --- "a/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" +++ "b/wandb/run-20220301_013112-3e2necnj/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.5579, "train/learning_rate": 9.345794392523364e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 9916, "_timestamp": 1646108188, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 20.0, 421.0, 554.0, 21.0, 0.0, 0.0, 2.0, 1.0], "bins": [-573.1256713867188, -563.2627563476562, -553.3998413085938, -543.5369873046875, -533.674072265625, -523.8111572265625, -513.9482421875, -504.0853271484375, -494.2224426269531, -484.3595275878906, -474.49664306640625, -464.63372802734375, -454.77081298828125, -444.9079284667969, -435.0450134277344, -425.18212890625, -415.3192138671875, -405.456298828125, -395.5934143066406, -385.7304992675781, -375.8675842285156, -366.00469970703125, -356.14178466796875, -346.27886962890625, -336.41595458984375, -326.55303955078125, -316.6901550292969, -306.8272399902344, -296.9643249511719, -287.1014404296875, -277.238525390625, -267.3756103515625, -257.5126953125, -247.64979553222656, -237.78688049316406, -227.92398071289062, -218.0610809326172, -208.19818115234375, -198.33526611328125, -188.4723663330078, -178.60946655273438, -168.74656677246094, -158.88365173339844, -149.020751953125, -139.15785217285156, -129.29495239257812, -119.43203735351562, -109.56913757324219, -99.70622253417969, -89.84331512451172, -79.98041534423828, -70.11750793457031, -60.25460433959961, -50.391700744628906, -40.52879333496094, -30.6658935546875, -20.802989959716797, -10.940085411071777, -1.0771808624267578, 8.785724639892578, 18.64862823486328, 28.511531829833984, 38.37443923950195, 48.23733901977539, 58.10024642944336]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 14.0, 11.0, 17.0, 21.0, 24.0, 25.0, 30.0, 26.0, 39.0, 40.0, 38.0, 43.0, 54.0, 42.0, 45.0, 42.0, 57.0, 37.0, 38.0, 45.0, 41.0, 37.0, 26.0, 28.0, 32.0, 21.0, 10.0, 17.0, 23.0, 9.0, 12.0, 10.0, 4.0, 11.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.35408020019531, -78.11407470703125, -75.87406921386719, -73.63406372070312, -71.39405822753906, -69.154052734375, -66.91404724121094, -64.67404174804688, -62.43403625488281, -60.19403076171875, -57.95402526855469, -55.714019775390625, -53.47401428222656, -51.2340087890625, -48.99400329589844, -46.753997802734375, -44.51398849487305, -42.273983001708984, -40.03397750854492, -37.79397201538086, -35.5539665222168, -33.313961029052734, -31.07395362854004, -28.833948135375977, -26.593942642211914, -24.35393714904785, -22.11393165588379, -19.873924255371094, -17.63391876220703, -15.393914222717285, -13.153907775878906, -10.913902282714844, -8.673896789550781, -6.433891296386719, -4.193885326385498, -1.9538793563842773, 0.28612613677978516, 2.5261316299438477, 4.766138076782227, 7.006143569946289, 9.246149063110352, 11.486154556274414, 13.726160049438477, 15.966166496276855, 18.206172943115234, 20.446178436279297, 22.68618392944336, 24.926189422607422, 27.166194915771484, 29.406200408935547, 31.64620590209961, 33.88621139526367, 36.126216888427734, 38.3662223815918, 40.606231689453125, 42.84623718261719, 45.08624267578125, 47.32624816894531, 49.566253662109375, 51.80625915527344, 54.0462646484375, 56.28627014160156, 58.526275634765625, 60.76628112792969, 63.00628662109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 20.0, 22.0, 27.0, 30.0, 48.0, 41.0, 58.0, 54.0, 51.0, 62.0, 54.0, 71.0, 57.0, 61.0, 53.0, 49.0, 38.0, 36.0, 40.0, 24.0, 21.0, 15.0, 14.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.7642822265625, -6.602783203125, -6.4412841796875, -6.27978515625, -6.1182861328125, -5.956787109375, -5.7952880859375, -5.6337890625, -5.4722900390625, -5.310791015625, -5.1492919921875, -4.98779296875, -4.8262939453125, -4.664794921875, -4.5032958984375, -4.341796875, -4.1802978515625, -4.018798828125, -3.8572998046875, -3.69580078125, -3.5343017578125, -3.372802734375, -3.2113037109375, -3.0498046875, -2.8883056640625, -2.726806640625, -2.5653076171875, -2.40380859375, -2.2423095703125, -2.080810546875, -1.9193115234375, -1.7578125, -1.5963134765625, -1.434814453125, -1.2733154296875, -1.11181640625, -0.9503173828125, -0.788818359375, -0.6273193359375, -0.4658203125, -0.3043212890625, -0.142822265625, 0.0186767578125, 0.18017578125, 0.3416748046875, 0.503173828125, 0.6646728515625, 0.826171875, 0.9876708984375, 1.149169921875, 1.3106689453125, 1.47216796875, 1.6336669921875, 1.795166015625, 1.9566650390625, 2.1181640625, 2.2796630859375, 2.441162109375, 2.6026611328125, 2.76416015625, 2.9256591796875, 3.087158203125, 3.2486572265625, 3.41015625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 9.0, 11.0, 17.0, 30.0, 62.0, 86.0, 116.0, 172.0, 373.0, 714.0, 1670.0, 5326.0, 26656.0, 482826.0, 3521891.0, 133920.0, 14339.0, 3441.0, 1325.0, 585.0, 289.0, 163.0, 85.0, 52.0, 40.0, 23.0, 17.0, 9.0, 12.0, 8.0, 1.0, 1.0], "bins": [-33.09375, -32.37939453125, -31.6650390625, -30.95068359375, -30.236328125, -29.52197265625, -28.8076171875, -28.09326171875, -27.37890625, -26.66455078125, -25.9501953125, -25.23583984375, -24.521484375, -23.80712890625, -23.0927734375, -22.37841796875, -21.6640625, -20.94970703125, -20.2353515625, -19.52099609375, -18.806640625, -18.09228515625, -17.3779296875, -16.66357421875, -15.94921875, -15.23486328125, -14.5205078125, -13.80615234375, -13.091796875, -12.37744140625, -11.6630859375, -10.94873046875, -10.234375, -9.52001953125, -8.8056640625, -8.09130859375, -7.376953125, -6.66259765625, -5.9482421875, -5.23388671875, -4.51953125, -3.80517578125, -3.0908203125, -2.37646484375, -1.662109375, -0.94775390625, -0.2333984375, 0.48095703125, 1.1953125, 1.90966796875, 2.6240234375, 3.33837890625, 4.052734375, 4.76708984375, 5.4814453125, 6.19580078125, 6.91015625, 7.62451171875, 8.3388671875, 9.05322265625, 9.767578125, 10.48193359375, 11.1962890625, 11.91064453125, 12.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 34.0, 44.0, 74.0, 135.0, 237.0, 330.0, 585.0, 820.0, 699.0, 430.0, 254.0, 149.0, 100.0, 56.0, 34.0, 28.0, 16.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.219482421875, -14.54833984375, -13.877197265625, -13.2060546875, -12.534912109375, -11.86376953125, -11.192626953125, -10.521484375, -9.850341796875, -9.17919921875, -8.508056640625, -7.8369140625, -7.165771484375, -6.49462890625, -5.823486328125, -5.15234375, -4.481201171875, -3.81005859375, -3.138916015625, -2.4677734375, -1.796630859375, -1.12548828125, -0.454345703125, 0.216796875, 0.887939453125, 1.55908203125, 2.230224609375, 2.9013671875, 3.572509765625, 4.24365234375, 4.914794921875, 5.5859375, 6.257080078125, 6.92822265625, 7.599365234375, 8.2705078125, 8.941650390625, 9.61279296875, 10.283935546875, 10.955078125, 11.626220703125, 12.29736328125, 12.968505859375, 13.6396484375, 14.310791015625, 14.98193359375, 15.653076171875, 16.32421875, 16.995361328125, 17.66650390625, 18.337646484375, 19.0087890625, 19.679931640625, 20.35107421875, 21.022216796875, 21.693359375, 22.364501953125, 23.03564453125, 23.706787109375, 24.3779296875, 25.049072265625, 25.72021484375, 26.391357421875, 27.0625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 18.0, 26.0, 29.0, 66.0, 112.0, 262.0, 565.0, 1339.0, 4538.0, 526046.0, 3648990.0, 9143.0, 1741.0, 686.0, 325.0, 153.0, 91.0, 62.0, 29.0, 12.0, 8.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.5625, -70.1552734375, -67.748046875, -65.3408203125, -62.93359375, -60.5263671875, -58.119140625, -55.7119140625, -53.3046875, -50.8974609375, -48.490234375, -46.0830078125, -43.67578125, -41.2685546875, -38.861328125, -36.4541015625, -34.046875, -31.6396484375, -29.232421875, -26.8251953125, -24.41796875, -22.0107421875, -19.603515625, -17.1962890625, -14.7890625, -12.3818359375, -9.974609375, -7.5673828125, -5.16015625, -2.7529296875, -0.345703125, 2.0615234375, 4.46875, 6.8759765625, 9.283203125, 11.6904296875, 14.09765625, 16.5048828125, 18.912109375, 21.3193359375, 23.7265625, 26.1337890625, 28.541015625, 30.9482421875, 33.35546875, 35.7626953125, 38.169921875, 40.5771484375, 42.984375, 45.3916015625, 47.798828125, 50.2060546875, 52.61328125, 55.0205078125, 57.427734375, 59.8349609375, 62.2421875, 64.6494140625, 67.056640625, 69.4638671875, 71.87109375, 74.2783203125, 76.685546875, 79.0927734375, 81.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 16.0, 44.0, 193.0, 425.0, 243.0, 73.0, 14.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.2716064453125, -208.23072814941406, -204.18984985351562, -200.1489715576172, -196.10809326171875, -192.0672149658203, -188.02633666992188, -183.9854736328125, -179.944580078125, -175.90370178222656, -171.86282348632812, -167.8219451904297, -163.78106689453125, -159.7401885986328, -155.69931030273438, -151.658447265625, -147.61756896972656, -143.57669067382812, -139.5358123779297, -135.49493408203125, -131.4540557861328, -127.41317749023438, -123.37230682373047, -119.33142852783203, -115.2905502319336, -111.24967193603516, -107.20879364013672, -103.16791534423828, -99.12704467773438, -95.08616638183594, -91.0452880859375, -87.00440979003906, -82.96353149414062, -78.92265319824219, -74.88177490234375, -70.84089660644531, -66.80001831054688, -62.7591438293457, -58.71826934814453, -54.677391052246094, -50.63651657104492, -46.595638275146484, -42.55476379394531, -38.513885498046875, -34.47300720214844, -30.43212890625, -26.391252517700195, -22.35037612915039, -18.309497833251953, -14.268620491027832, -10.227743148803711, -6.18686580657959, -2.1459884643554688, 1.8948898315429688, 5.935766220092773, 9.976642608642578, 14.017520904541016, 18.058399200439453, 22.099275588989258, 26.140151977539062, 30.1810302734375, 34.22190856933594, 38.262786865234375, 42.30366134643555, 46.344539642333984]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 5.0, 9.0, 5.0, 12.0, 5.0, 20.0, 14.0, 16.0, 19.0, 22.0, 21.0, 16.0, 37.0, 31.0, 42.0, 26.0, 30.0, 44.0, 38.0, 37.0, 30.0, 30.0, 37.0, 39.0, 41.0, 33.0, 51.0, 31.0, 34.0, 28.0, 28.0, 21.0, 19.0, 14.0, 27.0, 12.0, 11.0, 7.0, 13.0, 6.0, 7.0, 6.0, 10.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0], "bins": [-44.282958984375, -43.00820541381836, -41.73345184326172, -40.45869827270508, -39.18394470214844, -37.9091911315918, -36.634437561035156, -35.35968780517578, -34.084930419921875, -32.810176849365234, -31.535423278808594, -30.260669708251953, -28.985916137695312, -27.711162567138672, -26.436410903930664, -25.161657333374023, -23.886905670166016, -22.612152099609375, -21.337398529052734, -20.062644958496094, -18.787891387939453, -17.513137817382812, -16.238386154174805, -14.963632583618164, -13.688879013061523, -12.414125442504883, -11.139371871948242, -9.864619255065918, -8.589865684509277, -7.315112113952637, -6.040359020233154, -4.765605926513672, -3.4908523559570312, -2.2160990238189697, -0.9413456916809082, 0.3334076404571533, 1.6081609725952148, 2.8829145431518555, 4.157667636871338, 5.43242073059082, 6.707174301147461, 7.981927871704102, 9.256681442260742, 10.531434059143066, 11.806187629699707, 13.080941200256348, 14.355693817138672, 15.630447387695312, 16.905200958251953, 18.179954528808594, 19.454708099365234, 20.729461669921875, 22.004215240478516, 23.278968811035156, 24.553720474243164, 25.828474044799805, 27.103227615356445, 28.377981185913086, 29.652734756469727, 30.927488327026367, 32.202239990234375, 33.476993560791016, 34.751747131347656, 36.0265007019043, 37.30125427246094]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 29.0, 46.0, 60.0, 85.0, 110.0, 191.0, 242.0, 364.0, 519.0, 720.0, 1137.0, 1540.0, 2265.0, 3384.0, 4838.0, 7391.0, 10979.0, 16461.0, 24432.0, 37086.0, 56146.0, 87430.0, 130522.0, 171932.0, 158227.0, 113185.0, 74671.0, 48235.0, 31832.0, 21042.0, 14026.0, 9492.0, 6240.0, 4304.0, 2913.0, 1946.0, 1404.0, 934.0, 659.0, 475.0, 321.0, 234.0, 148.0, 101.0, 84.0, 58.0, 31.0, 25.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.3349571228027344, -0.32372283935546875, -0.3124885559082031, -0.3012542724609375, -0.2900199890136719, -0.27878570556640625, -0.2675514221191406, -0.256317138671875, -0.24508285522460938, -0.23384857177734375, -0.22261428833007812, -0.2113800048828125, -0.20014572143554688, -0.18891143798828125, -0.17767715454101562, -0.16644287109375, -0.15520858764648438, -0.14397430419921875, -0.13274002075195312, -0.1215057373046875, -0.11027145385742188, -0.09903717041015625, -0.08780288696289062, -0.076568603515625, -0.06533432006835938, -0.05410003662109375, -0.042865753173828125, -0.0316314697265625, -0.020397186279296875, -0.00916290283203125, 0.002071380615234375, 0.0133056640625, 0.024539947509765625, 0.03577423095703125, 0.047008514404296875, 0.0582427978515625, 0.06947708129882812, 0.08071136474609375, 0.09194564819335938, 0.103179931640625, 0.11441421508789062, 0.12564849853515625, 0.13688278198242188, 0.1481170654296875, 0.15935134887695312, 0.17058563232421875, 0.18181991577148438, 0.19305419921875, 0.20428848266601562, 0.21552276611328125, 0.22675704956054688, 0.2379913330078125, 0.24922561645507812, 0.26045989990234375, 0.2716941833496094, 0.282928466796875, 0.2941627502441406, 0.30539703369140625, 0.3166313171386719, 0.3278656005859375, 0.3390998840332031, 0.35033416748046875, 0.3615684509277344, 0.372802734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 8.0, 14.0, 18.0, 16.0, 14.0, 19.0, 30.0, 31.0, 27.0, 32.0, 29.0, 46.0, 42.0, 40.0, 38.0, 47.0, 1066.0, 33.0, 33.0, 48.0, 41.0, 35.0, 32.0, 21.0, 34.0, 32.0, 25.0, 14.0, 29.0, 18.0, 14.0, 10.0, 16.0, 8.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.214141845703125, -2.14117431640625, -2.068206787109375, -1.9952392578125, -1.922271728515625, -1.84930419921875, -1.776336669921875, -1.703369140625, -1.630401611328125, -1.55743408203125, -1.484466552734375, -1.4114990234375, -1.338531494140625, -1.26556396484375, -1.192596435546875, -1.11962890625, -1.046661376953125, -0.97369384765625, -0.900726318359375, -0.8277587890625, -0.754791259765625, -0.68182373046875, -0.608856201171875, -0.535888671875, -0.462921142578125, -0.38995361328125, -0.316986083984375, -0.2440185546875, -0.171051025390625, -0.09808349609375, -0.025115966796875, 0.0478515625, 0.120819091796875, 0.19378662109375, 0.266754150390625, 0.3397216796875, 0.412689208984375, 0.48565673828125, 0.558624267578125, 0.631591796875, 0.704559326171875, 0.77752685546875, 0.850494384765625, 0.9234619140625, 0.996429443359375, 1.06939697265625, 1.142364501953125, 1.21533203125, 1.288299560546875, 1.36126708984375, 1.434234619140625, 1.5072021484375, 1.580169677734375, 1.65313720703125, 1.726104736328125, 1.799072265625, 1.872039794921875, 1.94500732421875, 2.017974853515625, 2.0909423828125, 2.163909912109375, 2.23687744140625, 2.309844970703125, 2.3828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 4.0, 11.0, 14.0, 23.0, 36.0, 58.0, 92.0, 102.0, 189.0, 303.0, 514.0, 755.0, 1359.0, 2123.0, 3583.0, 5903.0, 9968.0, 16434.0, 26980.0, 44670.0, 72015.0, 111197.0, 154575.0, 1220992.0, 148644.0, 103884.0, 67155.0, 41641.0, 25327.0, 15238.0, 9227.0, 5613.0, 3340.0, 2023.0, 1206.0, 734.0, 445.0, 258.0, 176.0, 96.0, 74.0, 52.0, 28.0, 20.0, 15.0, 14.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2753715515136719, -0.26631927490234375, -0.2572669982910156, -0.2482147216796875, -0.23916244506835938, -0.23011016845703125, -0.22105789184570312, -0.212005615234375, -0.20295333862304688, -0.19390106201171875, -0.18484878540039062, -0.1757965087890625, -0.16674423217773438, -0.15769195556640625, -0.14863967895507812, -0.13958740234375, -0.13053512573242188, -0.12148284912109375, -0.11243057250976562, -0.1033782958984375, -0.09432601928710938, -0.08527374267578125, -0.07622146606445312, -0.067169189453125, -0.058116912841796875, -0.04906463623046875, -0.040012359619140625, -0.0309600830078125, -0.021907806396484375, -0.01285552978515625, -0.003803253173828125, 0.0052490234375, 0.014301300048828125, 0.02335357666015625, 0.032405853271484375, 0.0414581298828125, 0.050510406494140625, 0.05956268310546875, 0.06861495971679688, 0.077667236328125, 0.08671951293945312, 0.09577178955078125, 0.10482406616210938, 0.1138763427734375, 0.12292861938476562, 0.13198089599609375, 0.14103317260742188, 0.15008544921875, 0.15913772583007812, 0.16819000244140625, 0.17724227905273438, 0.1862945556640625, 0.19534683227539062, 0.20439910888671875, 0.21345138549804688, 0.222503662109375, 0.23155593872070312, 0.24060821533203125, 0.24966049194335938, 0.2587127685546875, 0.2677650451660156, 0.27681732177734375, 0.2858695983886719, 0.294921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 11.0, 4.0, 20.0, 16.0, 12.0, 30.0, 38.0, 44.0, 42.0, 59.0, 65.0, 57.0, 56.0, 71.0, 75.0, 47.0, 58.0, 42.0, 54.0, 35.0, 30.0, 21.0, 12.0, 17.0, 14.0, 8.0, 10.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020160675048828125, -0.0019510090351104736, -0.0018859505653381348, -0.001820892095565796, -0.001755833625793457, -0.0016907751560211182, -0.0016257166862487793, -0.0015606582164764404, -0.0014955997467041016, -0.0014305412769317627, -0.0013654828071594238, -0.001300424337387085, -0.001235365867614746, -0.0011703073978424072, -0.0011052489280700684, -0.0010401904582977295, -0.0009751319885253906, -0.0009100735187530518, -0.0008450150489807129, -0.000779956579208374, -0.0007148981094360352, -0.0006498396396636963, -0.0005847811698913574, -0.0005197227001190186, -0.0004546642303466797, -0.0003896057605743408, -0.00032454729080200195, -0.0002594888210296631, -0.00019443035125732422, -0.00012937188148498535, -6.431341171264648e-05, 7.450580596923828e-07, 6.580352783203125e-05, 0.00013086199760437012, 0.00019592046737670898, 0.00026097893714904785, 0.0003260374069213867, 0.0003910958766937256, 0.00045615434646606445, 0.0005212128162384033, 0.0005862712860107422, 0.0006513297557830811, 0.0007163882255554199, 0.0007814466953277588, 0.0008465051651000977, 0.0009115636348724365, 0.0009766221046447754, 0.0010416805744171143, 0.0011067390441894531, 0.001171797513961792, 0.0012368559837341309, 0.0013019144535064697, 0.0013669729232788086, 0.0014320313930511475, 0.0014970898628234863, 0.0015621483325958252, 0.001627206802368164, 0.001692265272140503, 0.0017573237419128418, 0.0018223822116851807, 0.0018874406814575195, 0.0019524991512298584, 0.0020175576210021973, 0.002082616090774536, 0.002147674560546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 13.0, 13.0, 22.0, 29.0, 39.0, 45.0, 49.0, 74.0, 103.0, 141.0, 137.0, 191.0, 344.0, 716.0, 5486.0, 1028896.0, 9972.0, 807.0, 412.0, 256.0, 158.0, 129.0, 107.0, 78.0, 45.0, 49.0, 28.0, 30.0, 20.0, 27.0, 28.0, 12.0, 6.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0401611328125, -0.038999080657958984, -0.03783702850341797, -0.03667497634887695, -0.03551292419433594, -0.03435087203979492, -0.033188819885253906, -0.03202676773071289, -0.030864715576171875, -0.02970266342163086, -0.028540611267089844, -0.027378559112548828, -0.026216506958007812, -0.025054454803466797, -0.02389240264892578, -0.022730350494384766, -0.02156829833984375, -0.020406246185302734, -0.01924419403076172, -0.018082141876220703, -0.016920089721679688, -0.015758037567138672, -0.014595985412597656, -0.01343393325805664, -0.012271881103515625, -0.01110982894897461, -0.009947776794433594, -0.008785724639892578, -0.0076236724853515625, -0.006461620330810547, -0.005299568176269531, -0.004137516021728516, -0.0029754638671875, -0.0018134117126464844, -0.0006513595581054688, 0.0005106925964355469, 0.0016727447509765625, 0.002834796905517578, 0.003996849060058594, 0.005158901214599609, 0.006320953369140625, 0.007483005523681641, 0.008645057678222656, 0.009807109832763672, 0.010969161987304688, 0.012131214141845703, 0.013293266296386719, 0.014455318450927734, 0.01561737060546875, 0.016779422760009766, 0.01794147491455078, 0.019103527069091797, 0.020265579223632812, 0.021427631378173828, 0.022589683532714844, 0.02375173568725586, 0.024913787841796875, 0.02607583999633789, 0.027237892150878906, 0.028399944305419922, 0.029561996459960938, 0.030724048614501953, 0.03188610076904297, 0.033048152923583984, 0.034210205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 979.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028607146814465523, -0.027993997558951378, -0.027380848303437233, -0.026767700910568237, -0.026154551655054092, -0.025541402399539948, -0.024928253144025803, -0.024315103888511658, -0.023701954632997513, -0.023088805377483368, -0.022475656121969223, -0.021862506866455078, -0.021249359473586082, -0.020636210218071938, -0.020023060962557793, -0.019409911707043648, -0.018796764314174652, -0.018183615058660507, -0.017570465803146362, -0.016957316547632217, -0.016344169154763222, -0.015731019899249077, -0.015117870643734932, -0.014504721388220787, -0.013891572132706642, -0.013278422877192497, -0.012665274553000927, -0.012052125297486782, -0.011438976041972637, -0.010825827717781067, -0.010212678462266922, -0.009599529206752777, -0.008986380882561207, -0.008373231627047062, -0.007760082837194204, -0.007146934047341347, -0.006533784791827202, -0.005920636001974344, -0.005307487212121487, -0.004694337956607342, -0.004081189166754484, -0.003468040144070983, -0.0028548911213874817, -0.002241742331534624, -0.0016285933088511229, -0.0010154442861676216, -0.000402295496314764, 0.00021085375919938087, 0.0008240025490522385, 0.0014371515717357397, 0.002050300594419241, 0.0026634493842720985, 0.0032765984069556, 0.003889747429639101, 0.004502896219491959, 0.0051160454750061035, 0.005729194264858961, 0.006342343054711819, 0.006955492310225964, 0.007568641100078821, 0.008181789889931679, 0.008794939145445824, 0.009408088400959969, 0.010021237656474113, 0.010634385980665684]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 11.0, 10.0, 20.0, 25.0, 26.0, 53.0, 35.0, 36.0, 55.0, 59.0, 55.0, 68.0, 55.0, 69.0, 66.0, 62.0, 52.0, 51.0, 43.0, 37.0, 16.0, 22.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011274218559265137, -0.0010774759575724602, -0.0010275300592184067, -0.0009775841608643532, -0.0009276382625102997, -0.0008776923641562462, -0.0008277464658021927, -0.0007778005674481392, -0.0007278546690940857, -0.0006779087707400322, -0.0006279628723859787, -0.0005780169740319252, -0.0005280710756778717, -0.0004781251773238182, -0.0004281792789697647, -0.0003782333806157112, -0.0003282874822616577, -0.0002783415839076042, -0.00022839568555355072, -0.00017844978719949722, -0.00012850388884544373, -7.855799049139023e-05, -2.861209213733673e-05, 2.1333806216716766e-05, 7.127970457077026e-05, 0.00012122560292482376, 0.00017117150127887726, 0.00022111739963293076, 0.00027106329798698425, 0.00032100919634103775, 0.00037095509469509125, 0.00042090099304914474, 0.00047084689140319824, 0.0005207927897572517, 0.0005707386881113052, 0.0006206845864653587, 0.0006706304848194122, 0.0007205763831734657, 0.0007705222815275192, 0.0008204681798815727, 0.0008704140782356262, 0.0009203599765896797, 0.0009703058749437332, 0.0010202517732977867, 0.0010701976716518402, 0.0011201435700058937, 0.0011700894683599472, 0.0012200353667140007, 0.0012699812650680542, 0.0013199271634221077, 0.0013698730617761612, 0.0014198189601302147, 0.0014697648584842682, 0.0015197107568383217, 0.0015696566551923752, 0.0016196025535464287, 0.0016695484519004822, 0.0017194943502545357, 0.0017694402486085892, 0.0018193861469626427, 0.0018693320453166962, 0.0019192779436707497, 0.001969223842024803, 0.0020191697403788567, 0.00206911563873291]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 13.0, 5.0, 13.0, 26.0, 29.0, 33.0, 64.0, 62.0, 131.0, 181.0, 224.0, 401.0, 512.0, 884.0, 1401.0, 2391.0, 3829.0, 6746.0, 13246.0, 34029.0, 348266.0, 559734.0, 42755.0, 15040.0, 7447.0, 4349.0, 2382.0, 1483.0, 962.0, 613.0, 397.0, 273.0, 188.0, 137.0, 84.0, 57.0, 46.0, 27.0, 29.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.07470703125, -17.4931640625, -16.91162109375, -16.330078125, -15.74853515625, -15.1669921875, -14.58544921875, -14.00390625, -13.42236328125, -12.8408203125, -12.25927734375, -11.677734375, -11.09619140625, -10.5146484375, -9.93310546875, -9.3515625, -8.77001953125, -8.1884765625, -7.60693359375, -7.025390625, -6.44384765625, -5.8623046875, -5.28076171875, -4.69921875, -4.11767578125, -3.5361328125, -2.95458984375, -2.373046875, -1.79150390625, -1.2099609375, -0.62841796875, -0.046875, 0.53466796875, 1.1162109375, 1.69775390625, 2.279296875, 2.86083984375, 3.4423828125, 4.02392578125, 4.60546875, 5.18701171875, 5.7685546875, 6.35009765625, 6.931640625, 7.51318359375, 8.0947265625, 8.67626953125, 9.2578125, 9.83935546875, 10.4208984375, 11.00244140625, 11.583984375, 12.16552734375, 12.7470703125, 13.32861328125, 13.91015625, 14.49169921875, 15.0732421875, 15.65478515625, 16.236328125, 16.81787109375, 17.3994140625, 17.98095703125, 18.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 11.0, 16.0, 24.0, 14.0, 30.0, 32.0, 29.0, 40.0, 37.0, 46.0, 60.0, 56.0, 113.0, 412.0, 1511.0, 162.0, 57.0, 53.0, 49.0, 47.0, 29.0, 47.0, 25.0, 18.0, 19.0, 19.0, 17.0, 9.0, 10.0, 6.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.765625, -15.3408203125, -14.916015625, -14.4912109375, -14.06640625, -13.6416015625, -13.216796875, -12.7919921875, -12.3671875, -11.9423828125, -11.517578125, -11.0927734375, -10.66796875, -10.2431640625, -9.818359375, -9.3935546875, -8.96875, -8.5439453125, -8.119140625, -7.6943359375, -7.26953125, -6.8447265625, -6.419921875, -5.9951171875, -5.5703125, -5.1455078125, -4.720703125, -4.2958984375, -3.87109375, -3.4462890625, -3.021484375, -2.5966796875, -2.171875, -1.7470703125, -1.322265625, -0.8974609375, -0.47265625, -0.0478515625, 0.376953125, 0.8017578125, 1.2265625, 1.6513671875, 2.076171875, 2.5009765625, 2.92578125, 3.3505859375, 3.775390625, 4.2001953125, 4.625, 5.0498046875, 5.474609375, 5.8994140625, 6.32421875, 6.7490234375, 7.173828125, 7.5986328125, 8.0234375, 8.4482421875, 8.873046875, 9.2978515625, 9.72265625, 10.1474609375, 10.572265625, 10.9970703125, 11.421875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 7.0, 21.0, 13.0, 31.0, 18.0, 39.0, 31.0, 62.0, 62.0, 130.0, 273.0, 1353.0, 2075228.0, 1066373.0, 1222.0, 291.0, 141.0, 86.0, 59.0, 36.0, 35.0, 25.0, 21.0, 22.0, 14.0, 17.0, 19.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.69580078125, -45.8603515625, -44.02490234375, -42.189453125, -40.35400390625, -38.5185546875, -36.68310546875, -34.84765625, -33.01220703125, -31.1767578125, -29.34130859375, -27.505859375, -25.67041015625, -23.8349609375, -21.99951171875, -20.1640625, -18.32861328125, -16.4931640625, -14.65771484375, -12.822265625, -10.98681640625, -9.1513671875, -7.31591796875, -5.48046875, -3.64501953125, -1.8095703125, 0.02587890625, 1.861328125, 3.69677734375, 5.5322265625, 7.36767578125, 9.203125, 11.03857421875, 12.8740234375, 14.70947265625, 16.544921875, 18.38037109375, 20.2158203125, 22.05126953125, 23.88671875, 25.72216796875, 27.5576171875, 29.39306640625, 31.228515625, 33.06396484375, 34.8994140625, 36.73486328125, 38.5703125, 40.40576171875, 42.2412109375, 44.07666015625, 45.912109375, 47.74755859375, 49.5830078125, 51.41845703125, 53.25390625, 55.08935546875, 56.9248046875, 58.76025390625, 60.595703125, 62.43115234375, 64.2666015625, 66.10205078125, 67.9375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 94.0, 612.0, 286.0, 18.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.560911178588867, -9.121329307556152, -6.6817474365234375, -4.242165565490723, -1.8025836944580078, 0.636998176574707, 3.076580047607422, 5.51616096496582, 7.955743789672852, 10.395325660705566, 12.834907531738281, 15.274489402770996, 17.71407127380371, 20.15365219116211, 22.59323501586914, 25.03281593322754, 27.47239875793457, 29.91197967529297, 32.3515625, 34.79114532470703, 37.23072814941406, 39.67030715942383, 42.10988998413086, 44.549468994140625, 46.989051818847656, 49.42863464355469, 51.86821746826172, 54.307796478271484, 56.747379302978516, 59.18696212768555, 61.62654113769531, 64.06612396240234, 66.50570678710938, 68.9452896118164, 71.38487243652344, 73.82445526123047, 76.2640380859375, 78.70361328125, 81.14319610595703, 83.58277893066406, 86.0223617553711, 88.46194458007812, 90.90152740478516, 93.34111022949219, 95.78068542480469, 98.22026824951172, 100.65985107421875, 103.09943389892578, 105.53901672363281, 107.97859954833984, 110.41818237304688, 112.8577651977539, 115.29734802246094, 117.73692321777344, 120.17650604248047, 122.6160888671875, 125.05567169189453, 127.49525451660156, 129.93482971191406, 132.37442016601562, 134.81399536132812, 137.2535858154297, 139.6931610107422, 142.13275146484375, 144.57232666015625]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 2.0, 9.0, 10.0, 9.0, 16.0, 12.0, 14.0, 19.0, 18.0, 24.0, 26.0, 29.0, 21.0, 35.0, 32.0, 33.0, 36.0, 41.0, 35.0, 40.0, 44.0, 53.0, 38.0, 41.0, 34.0, 32.0, 38.0, 47.0, 37.0, 26.0, 22.0, 18.0, 22.0, 15.0, 11.0, 12.0, 12.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-46.899314880371094, -45.650611877441406, -44.40190505981445, -43.153202056884766, -41.90449905395508, -40.655792236328125, -39.40708923339844, -38.15838623046875, -36.9096794128418, -35.66097640991211, -34.412269592285156, -33.16356658935547, -31.91486167907715, -30.666156768798828, -29.41745376586914, -28.16874885559082, -26.920045852661133, -25.671340942382812, -24.422637939453125, -23.173933029174805, -21.925228118896484, -20.676525115966797, -19.427820205688477, -18.179115295410156, -16.93041229248047, -15.681708335876465, -14.433003425598145, -13.18429946899414, -11.93559455871582, -10.686890602111816, -9.438186645507812, -8.189481735229492, -6.940776824951172, -5.69207239151001, -4.443367958068848, -3.1946640014648438, -1.9459595680236816, -0.6972551345825195, 0.5514488220214844, 1.8001537322998047, 3.0488576889038086, 4.297562122344971, 5.546266555786133, 6.794970512390137, 8.04367446899414, 9.292379379272461, 10.541083335876465, 11.789788246154785, 13.038492202758789, 14.287196159362793, 15.535901069641113, 16.784605026245117, 18.033309936523438, 19.282012939453125, 20.530717849731445, 21.779422760009766, 23.028125762939453, 24.276830673217773, 25.52553367614746, 26.77423858642578, 28.0229434967041, 29.271648406982422, 30.52035140991211, 31.76905632019043, 33.01776123046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 40.0, 35.0, 36.0, 51.0, 49.0, 49.0, 35.0, 61.0, 72.0, 49.0, 55.0, 53.0, 37.0, 45.0, 52.0, 28.0, 35.0, 32.0, 34.0, 22.0, 16.0, 7.0, 3.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2210693359375, -6.051513671875, -5.8819580078125, -5.71240234375, -5.5428466796875, -5.373291015625, -5.2037353515625, -5.0341796875, -4.8646240234375, -4.695068359375, -4.5255126953125, -4.35595703125, -4.1864013671875, -4.016845703125, -3.8472900390625, -3.677734375, -3.5081787109375, -3.338623046875, -3.1690673828125, -2.99951171875, -2.8299560546875, -2.660400390625, -2.4908447265625, -2.3212890625, -2.1517333984375, -1.982177734375, -1.8126220703125, -1.64306640625, -1.4735107421875, -1.303955078125, -1.1343994140625, -0.96484375, -0.7952880859375, -0.625732421875, -0.4561767578125, -0.28662109375, -0.1170654296875, 0.052490234375, 0.2220458984375, 0.3916015625, 0.5611572265625, 0.730712890625, 0.9002685546875, 1.06982421875, 1.2393798828125, 1.408935546875, 1.5784912109375, 1.748046875, 1.9176025390625, 2.087158203125, 2.2567138671875, 2.42626953125, 2.5958251953125, 2.765380859375, 2.9349365234375, 3.1044921875, 3.2740478515625, 3.443603515625, 3.6131591796875, 3.78271484375, 3.9522705078125, 4.121826171875, 4.2913818359375, 4.4609375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 14.0, 20.0, 40.0, 78.0, 90.0, 179.0, 303.0, 581.0, 1442.0, 4561.0, 24196.0, 390990.0, 3632661.0, 120839.0, 13014.0, 3091.0, 1052.0, 488.0, 227.0, 145.0, 89.0, 70.0, 35.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-40.375, -39.46435546875, -38.5537109375, -37.64306640625, -36.732421875, -35.82177734375, -34.9111328125, -34.00048828125, -33.08984375, -32.17919921875, -31.2685546875, -30.35791015625, -29.447265625, -28.53662109375, -27.6259765625, -26.71533203125, -25.8046875, -24.89404296875, -23.9833984375, -23.07275390625, -22.162109375, -21.25146484375, -20.3408203125, -19.43017578125, -18.51953125, -17.60888671875, -16.6982421875, -15.78759765625, -14.876953125, -13.96630859375, -13.0556640625, -12.14501953125, -11.234375, -10.32373046875, -9.4130859375, -8.50244140625, -7.591796875, -6.68115234375, -5.7705078125, -4.85986328125, -3.94921875, -3.03857421875, -2.1279296875, -1.21728515625, -0.306640625, 0.60400390625, 1.5146484375, 2.42529296875, 3.3359375, 4.24658203125, 5.1572265625, 6.06787109375, 6.978515625, 7.88916015625, 8.7998046875, 9.71044921875, 10.62109375, 11.53173828125, 12.4423828125, 13.35302734375, 14.263671875, 15.17431640625, 16.0849609375, 16.99560546875, 17.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 1.0, 10.0, 9.0, 30.0, 37.0, 71.0, 116.0, 154.0, 259.0, 422.0, 640.0, 763.0, 603.0, 369.0, 234.0, 130.0, 73.0, 61.0, 41.0, 23.0, 9.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.6533203125, -17.947265625, -17.2412109375, -16.53515625, -15.8291015625, -15.123046875, -14.4169921875, -13.7109375, -13.0048828125, -12.298828125, -11.5927734375, -10.88671875, -10.1806640625, -9.474609375, -8.7685546875, -8.0625, -7.3564453125, -6.650390625, -5.9443359375, -5.23828125, -4.5322265625, -3.826171875, -3.1201171875, -2.4140625, -1.7080078125, -1.001953125, -0.2958984375, 0.41015625, 1.1162109375, 1.822265625, 2.5283203125, 3.234375, 3.9404296875, 4.646484375, 5.3525390625, 6.05859375, 6.7646484375, 7.470703125, 8.1767578125, 8.8828125, 9.5888671875, 10.294921875, 11.0009765625, 11.70703125, 12.4130859375, 13.119140625, 13.8251953125, 14.53125, 15.2373046875, 15.943359375, 16.6494140625, 17.35546875, 18.0615234375, 18.767578125, 19.4736328125, 20.1796875, 20.8857421875, 21.591796875, 22.2978515625, 23.00390625, 23.7099609375, 24.416015625, 25.1220703125, 25.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 12.0, 7.0, 8.0, 25.0, 18.0, 45.0, 56.0, 105.0, 176.0, 377.0, 1285.0, 16107.0, 3893395.0, 277834.0, 3443.0, 669.0, 327.0, 142.0, 76.0, 61.0, 17.0, 30.0, 18.0, 13.0, 12.0, 6.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -44.40869140625, -42.1611328125, -39.91357421875, -37.666015625, -35.41845703125, -33.1708984375, -30.92333984375, -28.67578125, -26.42822265625, -24.1806640625, -21.93310546875, -19.685546875, -17.43798828125, -15.1904296875, -12.94287109375, -10.6953125, -8.44775390625, -6.2001953125, -3.95263671875, -1.705078125, 0.54248046875, 2.7900390625, 5.03759765625, 7.28515625, 9.53271484375, 11.7802734375, 14.02783203125, 16.275390625, 18.52294921875, 20.7705078125, 23.01806640625, 25.265625, 27.51318359375, 29.7607421875, 32.00830078125, 34.255859375, 36.50341796875, 38.7509765625, 40.99853515625, 43.24609375, 45.49365234375, 47.7412109375, 49.98876953125, 52.236328125, 54.48388671875, 56.7314453125, 58.97900390625, 61.2265625, 63.47412109375, 65.7216796875, 67.96923828125, 70.216796875, 72.46435546875, 74.7119140625, 76.95947265625, 79.20703125, 81.45458984375, 83.7021484375, 85.94970703125, 88.197265625, 90.44482421875, 92.6923828125, 94.93994140625, 97.1875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 36.0, 151.0, 460.0, 280.0, 77.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.6538848876953, -163.9443359375, -158.23477172851562, -152.5252227783203, -146.815673828125, -141.10610961914062, -135.3965606689453, -129.68701171875, -123.97745513916016, -118.26789855957031, -112.558349609375, -106.84879302978516, -101.13923645019531, -95.4296875, -89.72013092041016, -84.01057434082031, -78.301025390625, -72.59146881103516, -66.88191986083984, -61.17236328125, -55.46281051635742, -49.753257751464844, -44.043701171875, -38.33414840698242, -32.624595642089844, -26.915042877197266, -21.205488204956055, -15.495933532714844, -9.786380767822266, -4.0768280029296875, 1.6327285766601562, 7.342281341552734, 13.051849365234375, 18.761402130126953, 24.470956802368164, 30.180511474609375, 35.89006423950195, 41.59961700439453, 47.309173583984375, 53.01872634887695, 58.72827911376953, 64.43783569335938, 70.14738464355469, 75.85694122314453, 81.56649780273438, 87.27604675292969, 92.98560333251953, 98.69515991210938, 104.40470886230469, 110.11426544189453, 115.82381439208984, 121.53337097167969, 127.242919921875, 132.95248413085938, 138.6620330810547, 144.37158203125, 150.08114624023438, 155.7906951904297, 161.50025939941406, 167.20980834960938, 172.9193572998047, 178.62890625, 184.33847045898438, 190.0480194091797, 195.757568359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 20.0, 14.0, 24.0, 19.0, 18.0, 19.0, 35.0, 44.0, 42.0, 42.0, 53.0, 51.0, 48.0, 38.0, 44.0, 48.0, 47.0, 32.0, 43.0, 23.0, 41.0, 29.0, 32.0, 24.0, 38.0, 21.0, 16.0, 13.0, 15.0, 2.0, 9.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.267303466796875, -51.675743103027344, -50.08417892456055, -48.492618560791016, -46.90105438232422, -45.30949401855469, -43.717933654785156, -42.126373291015625, -40.53480911254883, -38.9432487487793, -37.3516845703125, -35.76012420654297, -34.16856384277344, -32.57699966430664, -30.98543930053711, -29.393877029418945, -27.80231475830078, -26.210752487182617, -24.619190216064453, -23.027629852294922, -21.436067581176758, -19.844505310058594, -18.252944946289062, -16.6613826751709, -15.069820404052734, -13.47825813293457, -11.886696815490723, -10.295135498046875, -8.703573226928711, -7.112011432647705, -5.520449638366699, -3.9288883209228516, -2.3373260498046875, -0.7457642555236816, 0.8457975387573242, 2.43735933303833, 4.028921127319336, 5.620482921600342, 7.212044715881348, 8.803606033325195, 10.39516830444336, 11.986730575561523, 13.578291893005371, 15.169853210449219, 16.761415481567383, 18.352977752685547, 19.944538116455078, 21.536100387573242, 23.127662658691406, 24.71922492980957, 26.310787200927734, 27.902347564697266, 29.49390983581543, 31.085472106933594, 32.677032470703125, 34.268592834472656, 35.86015701293945, 37.451717376708984, 39.04328155517578, 40.63484191894531, 42.226402282714844, 43.81796646118164, 45.40952682495117, 47.00109100341797, 48.5926513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 23.0, 25.0, 37.0, 63.0, 99.0, 149.0, 189.0, 300.0, 470.0, 723.0, 1155.0, 1642.0, 2769.0, 4415.0, 6930.0, 11315.0, 18100.0, 29291.0, 48200.0, 79185.0, 126807.0, 179916.0, 186340.0, 133353.0, 84004.0, 50657.0, 31157.0, 19255.0, 11853.0, 7508.0, 4510.0, 2835.0, 1842.0, 1213.0, 736.0, 518.0, 313.0, 173.0, 175.0, 102.0, 70.0, 32.0, 27.0, 21.0, 16.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3854179382324219, -0.37215423583984375, -0.3588905334472656, -0.3456268310546875, -0.3323631286621094, -0.31909942626953125, -0.3058357238769531, -0.292572021484375, -0.2793083190917969, -0.26604461669921875, -0.2527809143066406, -0.2395172119140625, -0.22625350952148438, -0.21298980712890625, -0.19972610473632812, -0.18646240234375, -0.17319869995117188, -0.15993499755859375, -0.14667129516601562, -0.1334075927734375, -0.12014389038085938, -0.10688018798828125, -0.09361648559570312, -0.080352783203125, -0.06708908081054688, -0.05382537841796875, -0.040561676025390625, -0.0272979736328125, -0.014034271240234375, -0.00077056884765625, 0.012493133544921875, 0.0257568359375, 0.039020538330078125, 0.05228424072265625, 0.06554794311523438, 0.0788116455078125, 0.09207534790039062, 0.10533905029296875, 0.11860275268554688, 0.131866455078125, 0.14513015747070312, 0.15839385986328125, 0.17165756225585938, 0.1849212646484375, 0.19818496704101562, 0.21144866943359375, 0.22471237182617188, 0.23797607421875, 0.2512397766113281, 0.26450347900390625, 0.2777671813964844, 0.2910308837890625, 0.3042945861816406, 0.31755828857421875, 0.3308219909667969, 0.344085693359375, 0.3573493957519531, 0.37061309814453125, 0.3838768005371094, 0.3971405029296875, 0.4104042053222656, 0.42366790771484375, 0.4369316101074219, 0.4501953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 7.0, 12.0, 11.0, 12.0, 21.0, 13.0, 16.0, 20.0, 28.0, 48.0, 36.0, 35.0, 49.0, 57.0, 51.0, 41.0, 1070.0, 53.0, 56.0, 53.0, 45.0, 32.0, 30.0, 38.0, 30.0, 27.0, 28.0, 23.0, 24.0, 7.0, 10.0, 9.0, 9.0, 17.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.231353759765625, -3.13458251953125, -3.037811279296875, -2.9410400390625, -2.844268798828125, -2.74749755859375, -2.650726318359375, -2.553955078125, -2.457183837890625, -2.36041259765625, -2.263641357421875, -2.1668701171875, -2.070098876953125, -1.97332763671875, -1.876556396484375, -1.77978515625, -1.683013916015625, -1.58624267578125, -1.489471435546875, -1.3927001953125, -1.295928955078125, -1.19915771484375, -1.102386474609375, -1.005615234375, -0.908843994140625, -0.81207275390625, -0.715301513671875, -0.6185302734375, -0.521759033203125, -0.42498779296875, -0.328216552734375, -0.2314453125, -0.134674072265625, -0.03790283203125, 0.058868408203125, 0.1556396484375, 0.252410888671875, 0.34918212890625, 0.445953369140625, 0.542724609375, 0.639495849609375, 0.73626708984375, 0.833038330078125, 0.9298095703125, 1.026580810546875, 1.12335205078125, 1.220123291015625, 1.31689453125, 1.413665771484375, 1.51043701171875, 1.607208251953125, 1.7039794921875, 1.800750732421875, 1.89752197265625, 1.994293212890625, 2.091064453125, 2.187835693359375, 2.28460693359375, 2.381378173828125, 2.4781494140625, 2.574920654296875, 2.67169189453125, 2.768463134765625, 2.865234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 26.0, 31.0, 55.0, 90.0, 164.0, 262.0, 417.0, 658.0, 1018.0, 1716.0, 2793.0, 4563.0, 7677.0, 12990.0, 21925.0, 37430.0, 63105.0, 101756.0, 151310.0, 1231360.0, 164621.0, 115425.0, 71977.0, 43097.0, 25598.0, 14868.0, 8677.0, 5322.0, 3220.0, 1934.0, 1150.0, 706.0, 417.0, 262.0, 194.0, 93.0, 49.0, 50.0, 29.0, 21.0, 15.0, 13.0, 9.0, 3.0, 3.0, 5.0, 0.0, 4.0], "bins": [-0.363037109375, -0.35285186767578125, -0.3426666259765625, -0.33248138427734375, -0.322296142578125, -0.31211090087890625, -0.3019256591796875, -0.29174041748046875, -0.28155517578125, -0.27136993408203125, -0.2611846923828125, -0.25099945068359375, -0.240814208984375, -0.23062896728515625, -0.2204437255859375, -0.21025848388671875, -0.2000732421875, -0.18988800048828125, -0.1797027587890625, -0.16951751708984375, -0.159332275390625, -0.14914703369140625, -0.1389617919921875, -0.12877655029296875, -0.11859130859375, -0.10840606689453125, -0.0982208251953125, -0.08803558349609375, -0.077850341796875, -0.06766510009765625, -0.0574798583984375, -0.04729461669921875, -0.037109375, -0.02692413330078125, -0.0167388916015625, -0.00655364990234375, 0.003631591796875, 0.01381683349609375, 0.0240020751953125, 0.03418731689453125, 0.04437255859375, 0.05455780029296875, 0.0647430419921875, 0.07492828369140625, 0.085113525390625, 0.09529876708984375, 0.1054840087890625, 0.11566925048828125, 0.1258544921875, 0.13603973388671875, 0.1462249755859375, 0.15641021728515625, 0.166595458984375, 0.17678070068359375, 0.1869659423828125, 0.19715118408203125, 0.20733642578125, 0.21752166748046875, 0.2277069091796875, 0.23789215087890625, 0.248077392578125, 0.25826263427734375, 0.2684478759765625, 0.27863311767578125, 0.288818359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 3.0, 7.0, 4.0, 12.0, 17.0, 18.0, 19.0, 25.0, 29.0, 34.0, 44.0, 39.0, 56.0, 48.0, 58.0, 75.0, 64.0, 67.0, 52.0, 47.0, 44.0, 38.0, 29.0, 33.0, 25.0, 24.0, 28.0, 16.0, 13.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023345947265625, -0.0022717267274856567, -0.0022088587284088135, -0.00214599072933197, -0.002083122730255127, -0.0020202547311782837, -0.0019573867321014404, -0.0018945187330245972, -0.001831650733947754, -0.0017687827348709106, -0.0017059147357940674, -0.0016430467367172241, -0.0015801787376403809, -0.0015173107385635376, -0.0014544427394866943, -0.001391574740409851, -0.0013287067413330078, -0.0012658387422561646, -0.0012029707431793213, -0.001140102744102478, -0.0010772347450256348, -0.0010143667459487915, -0.0009514987468719482, -0.000888630747795105, -0.0008257627487182617, -0.0007628947496414185, -0.0007000267505645752, -0.0006371587514877319, -0.0005742907524108887, -0.0005114227533340454, -0.00044855475425720215, -0.0003856867551803589, -0.0003228187561035156, -0.00025995075702667236, -0.0001970827579498291, -0.00013421475887298584, -7.134675979614258e-05, -8.478760719299316e-06, 5.4389238357543945e-05, 0.00011725723743438721, 0.00018012523651123047, 0.00024299323558807373, 0.000305861234664917, 0.00036872923374176025, 0.0004315972328186035, 0.0004944652318954468, 0.00055733323097229, 0.0006202012300491333, 0.0006830692291259766, 0.0007459372282028198, 0.0008088052272796631, 0.0008716732263565063, 0.0009345412254333496, 0.0009974092245101929, 0.0010602772235870361, 0.0011231452226638794, 0.0011860132217407227, 0.001248881220817566, 0.0013117492198944092, 0.0013746172189712524, 0.0014374852180480957, 0.001500353217124939, 0.0015632212162017822, 0.0016260892152786255, 0.0016889572143554688]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 12.0, 17.0, 27.0, 34.0, 41.0, 47.0, 70.0, 72.0, 95.0, 130.0, 187.0, 300.0, 598.0, 3586.0, 1026557.0, 14843.0, 751.0, 329.0, 230.0, 129.0, 109.0, 102.0, 82.0, 47.0, 38.0, 24.0, 25.0, 16.0, 7.0, 10.0, 12.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042236328125, -0.04085731506347656, -0.039478302001953125, -0.03809928894042969, -0.03672027587890625, -0.03534126281738281, -0.033962249755859375, -0.03258323669433594, -0.0312042236328125, -0.029825210571289062, -0.028446197509765625, -0.027067184448242188, -0.02568817138671875, -0.024309158325195312, -0.022930145263671875, -0.021551132202148438, -0.020172119140625, -0.018793106079101562, -0.017414093017578125, -0.016035079956054688, -0.01465606689453125, -0.013277053833007812, -0.011898040771484375, -0.010519027709960938, -0.0091400146484375, -0.0077610015869140625, -0.006381988525390625, -0.0050029754638671875, -0.00362396240234375, -0.0022449493408203125, -0.000865936279296875, 0.0005130767822265625, 0.00189208984375, 0.0032711029052734375, 0.004650115966796875, 0.0060291290283203125, 0.00740814208984375, 0.008787155151367188, 0.010166168212890625, 0.011545181274414062, 0.0129241943359375, 0.014303207397460938, 0.015682220458984375, 0.017061233520507812, 0.01844024658203125, 0.019819259643554688, 0.021198272705078125, 0.022577285766601562, 0.023956298828125, 0.025335311889648438, 0.026714324951171875, 0.028093338012695312, 0.02947235107421875, 0.030851364135742188, 0.032230377197265625, 0.03360939025878906, 0.0349884033203125, 0.03636741638183594, 0.037746429443359375, 0.03912544250488281, 0.04050445556640625, 0.04188346862792969, 0.043262481689453125, 0.04464149475097656, 0.0460205078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 524.0, 492.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02187264710664749, -0.02111779898405075, -0.02036294899880886, -0.01960810087621212, -0.01885325089097023, -0.01809840276837349, -0.01734355464577675, -0.01658870466053486, -0.01583385467529297, -0.015079005621373653, -0.014324156567454338, -0.013569308444857597, -0.012814458459615707, -0.012059610337018967, -0.011304761283099651, -0.010549912229180336, -0.009795064106583595, -0.00904021505266428, -0.008285365998744965, -0.007530517410486937, -0.006775668356567621, -0.006020819302648306, -0.005265970714390278, -0.0045111216604709625, -0.003756272606551647, -0.003001423552632332, -0.00224657473154366, -0.0014917259104549885, -0.0007368768565356731, 1.7972197383642197e-05, 0.0007728207856416702, 0.0015276698395609856, 0.00228252075612545, 0.0030373698100447655, 0.003792218631133437, 0.004547067452222109, 0.005301916506141424, 0.0060567655600607395, 0.0068116141483187675, 0.007566463202238083, 0.008321312256157398, 0.009076161310076714, 0.009831010363996029, 0.010585859417915344, 0.011340707540512085, 0.012095557525753975, 0.012850405648350716, 0.013605254702270031, 0.014360103756189346, 0.015114952810108662, 0.015869801864027977, 0.016624649986624718, 0.017379499971866608, 0.01813434809446335, 0.01888919621706009, 0.01964404620230198, 0.02039889618754387, 0.02115374431014061, 0.0219085942953825, 0.02266344241797924, 0.02341829240322113, 0.02417314052581787, 0.024927988648414612, 0.025682838633656502, 0.026437686756253242]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 13.0, 9.0, 13.0, 16.0, 22.0, 33.0, 19.0, 32.0, 35.0, 48.0, 59.0, 52.0, 38.0, 50.0, 47.0, 50.0, 68.0, 54.0, 51.0, 31.0, 33.0, 30.0, 37.0, 29.0, 22.0, 18.0, 15.0, 11.0, 15.0, 8.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000983893871307373, -0.0009442325681447983, -0.0009045712649822235, -0.0008649099618196487, -0.000825248658657074, -0.0007855873554944992, -0.0007459260523319244, -0.0007062647491693497, -0.0006666034460067749, -0.0006269421428442001, -0.0005872808396816254, -0.0005476195365190506, -0.0005079582333564758, -0.00046829693019390106, -0.0004286356270313263, -0.0003889743238687515, -0.00034931302070617676, -0.000309651717543602, -0.0002699904143810272, -0.00023032911121845245, -0.00019066780805587769, -0.00015100650489330292, -0.00011134520173072815, -7.168389856815338e-05, -3.202259540557861e-05, 7.638707756996155e-06, 4.730001091957092e-05, 8.696131408214569e-05, 0.00012662261724472046, 0.00016628392040729523, 0.00020594522356987, 0.00024560652673244476, 0.00028526782989501953, 0.0003249291330575943, 0.00036459043622016907, 0.00040425173938274384, 0.0004439130425453186, 0.00048357434570789337, 0.0005232356488704681, 0.0005628969520330429, 0.0006025582551956177, 0.0006422195583581924, 0.0006818808615207672, 0.000721542164683342, 0.0007612034678459167, 0.0008008647710084915, 0.0008405260741710663, 0.000880187377333641, 0.0009198486804962158, 0.0009595099836587906, 0.0009991712868213654, 0.0010388325899839401, 0.001078493893146515, 0.0011181551963090897, 0.0011578164994716644, 0.0011974778026342392, 0.001237139105796814, 0.0012768004089593887, 0.0013164617121219635, 0.0013561230152845383, 0.001395784318447113, 0.0014354456216096878, 0.0014751069247722626, 0.0015147682279348373, 0.0015544295310974121]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 25.0, 26.0, 38.0, 69.0, 112.0, 131.0, 231.0, 328.0, 602.0, 1074.0, 2405.0, 6356.0, 23466.0, 104769.0, 502465.0, 320371.0, 62366.0, 14984.0, 4629.0, 1797.0, 882.0, 460.0, 344.0, 225.0, 131.0, 74.0, 57.0, 34.0, 32.0, 13.0, 12.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.05224609375, -4.8935546875, -4.73486328125, -4.576171875, -4.41748046875, -4.2587890625, -4.10009765625, -3.94140625, -3.78271484375, -3.6240234375, -3.46533203125, -3.306640625, -3.14794921875, -2.9892578125, -2.83056640625, -2.671875, -2.51318359375, -2.3544921875, -2.19580078125, -2.037109375, -1.87841796875, -1.7197265625, -1.56103515625, -1.40234375, -1.24365234375, -1.0849609375, -0.92626953125, -0.767578125, -0.60888671875, -0.4501953125, -0.29150390625, -0.1328125, 0.02587890625, 0.1845703125, 0.34326171875, 0.501953125, 0.66064453125, 0.8193359375, 0.97802734375, 1.13671875, 1.29541015625, 1.4541015625, 1.61279296875, 1.771484375, 1.93017578125, 2.0888671875, 2.24755859375, 2.40625, 2.56494140625, 2.7236328125, 2.88232421875, 3.041015625, 3.19970703125, 3.3583984375, 3.51708984375, 3.67578125, 3.83447265625, 3.9931640625, 4.15185546875, 4.310546875, 4.46923828125, 4.6279296875, 4.78662109375, 4.9453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 16.0, 16.0, 13.0, 9.0, 18.0, 21.0, 25.0, 26.0, 34.0, 39.0, 28.0, 37.0, 42.0, 52.0, 60.0, 147.0, 1772.0, 196.0, 75.0, 50.0, 36.0, 28.0, 31.0, 30.0, 35.0, 30.0, 32.0, 18.0, 12.0, 20.0, 16.0, 8.0, 13.0, 6.0, 8.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-16.265625, -15.8212890625, -15.376953125, -14.9326171875, -14.48828125, -14.0439453125, -13.599609375, -13.1552734375, -12.7109375, -12.2666015625, -11.822265625, -11.3779296875, -10.93359375, -10.4892578125, -10.044921875, -9.6005859375, -9.15625, -8.7119140625, -8.267578125, -7.8232421875, -7.37890625, -6.9345703125, -6.490234375, -6.0458984375, -5.6015625, -5.1572265625, -4.712890625, -4.2685546875, -3.82421875, -3.3798828125, -2.935546875, -2.4912109375, -2.046875, -1.6025390625, -1.158203125, -0.7138671875, -0.26953125, 0.1748046875, 0.619140625, 1.0634765625, 1.5078125, 1.9521484375, 2.396484375, 2.8408203125, 3.28515625, 3.7294921875, 4.173828125, 4.6181640625, 5.0625, 5.5068359375, 5.951171875, 6.3955078125, 6.83984375, 7.2841796875, 7.728515625, 8.1728515625, 8.6171875, 9.0615234375, 9.505859375, 9.9501953125, 10.39453125, 10.8388671875, 11.283203125, 11.7275390625, 12.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 3.0, 5.0, 10.0, 14.0, 11.0, 10.0, 19.0, 9.0, 21.0, 28.0, 34.0, 30.0, 48.0, 45.0, 71.0, 110.0, 205.0, 430.0, 1472.0, 29980.0, 3098407.0, 12455.0, 1182.0, 415.0, 178.0, 103.0, 69.0, 51.0, 53.0, 34.0, 24.0, 32.0, 19.0, 17.0, 14.0, 16.0, 8.0, 12.0, 15.0, 8.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.296875, -24.374267578125, -23.45166015625, -22.529052734375, -21.6064453125, -20.683837890625, -19.76123046875, -18.838623046875, -17.916015625, -16.993408203125, -16.07080078125, -15.148193359375, -14.2255859375, -13.302978515625, -12.38037109375, -11.457763671875, -10.53515625, -9.612548828125, -8.68994140625, -7.767333984375, -6.8447265625, -5.922119140625, -4.99951171875, -4.076904296875, -3.154296875, -2.231689453125, -1.30908203125, -0.386474609375, 0.5361328125, 1.458740234375, 2.38134765625, 3.303955078125, 4.2265625, 5.149169921875, 6.07177734375, 6.994384765625, 7.9169921875, 8.839599609375, 9.76220703125, 10.684814453125, 11.607421875, 12.530029296875, 13.45263671875, 14.375244140625, 15.2978515625, 16.220458984375, 17.14306640625, 18.065673828125, 18.98828125, 19.910888671875, 20.83349609375, 21.756103515625, 22.6787109375, 23.601318359375, 24.52392578125, 25.446533203125, 26.369140625, 27.291748046875, 28.21435546875, 29.136962890625, 30.0595703125, 30.982177734375, 31.90478515625, 32.827392578125, 33.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [19.0, 408.0, 574.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.012465476989746, -2.6173341274261475, -0.22220277786254883, 2.172928810119629, 4.568059921264648, 6.963191032409668, 9.358323097229004, 11.753453254699707, 14.148585319519043, 16.543716430664062, 18.9388484954834, 21.333980560302734, 23.729110717773438, 26.12424087524414, 28.51937484741211, 30.914505004882812, 33.309635162353516, 35.70476531982422, 38.09989929199219, 40.49502944946289, 42.890159606933594, 45.28529357910156, 47.680423736572266, 50.07555389404297, 52.47068786621094, 54.86581802368164, 57.26095199584961, 59.65608215332031, 62.051212310791016, 64.44634246826172, 66.84147644042969, 69.23660278320312, 71.6317367553711, 74.02687072753906, 76.4219970703125, 78.81713104248047, 81.21226501464844, 83.60739135742188, 86.00252532958984, 88.39765930175781, 90.79278564453125, 93.18791961669922, 95.58304595947266, 97.97817993164062, 100.3733139038086, 102.76844024658203, 105.16357421875, 107.55870056152344, 109.95384216308594, 112.3489761352539, 114.74410247802734, 117.13923645019531, 119.53437042236328, 121.92949676513672, 124.32463073730469, 126.71975708007812, 129.11488342285156, 131.510009765625, 133.9051513671875, 136.30027770996094, 138.69540405273438, 141.09054565429688, 143.4856719970703, 145.88079833984375, 148.27593994140625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 14.0, 9.0, 7.0, 12.0, 17.0, 21.0, 21.0, 28.0, 29.0, 28.0, 27.0, 26.0, 46.0, 42.0, 62.0, 48.0, 38.0, 47.0, 49.0, 52.0, 51.0, 43.0, 35.0, 35.0, 39.0, 31.0, 27.0, 15.0, 16.0, 16.0, 9.0, 14.0, 13.0, 12.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.16040802001953, -45.56102752685547, -43.961647033691406, -42.362266540527344, -40.76288604736328, -39.16350555419922, -37.564125061035156, -35.964744567871094, -34.36536407470703, -32.76598358154297, -31.166603088378906, -29.567222595214844, -27.96784210205078, -26.36846160888672, -24.769079208374023, -23.16969871520996, -21.570316314697266, -19.970935821533203, -18.37155532836914, -16.772174835205078, -15.1727933883667, -13.573412895202637, -11.974031448364258, -10.374650955200195, -8.775270462036133, -7.17588996887207, -5.57650899887085, -3.977128028869629, -2.3777475357055664, -0.7783670425415039, 0.821014404296875, 2.4203948974609375, 4.019775390625, 5.6191558837890625, 7.218536853790283, 8.817917823791504, 10.417298316955566, 12.016678810119629, 13.616060256958008, 15.21544075012207, 16.814821243286133, 18.414201736450195, 20.013582229614258, 21.612964630126953, 23.212345123291016, 24.811725616455078, 26.41110610961914, 28.010486602783203, 29.609867095947266, 31.209247589111328, 32.80862808227539, 34.40800857543945, 36.007389068603516, 37.60676956176758, 39.206153869628906, 40.80553436279297, 42.40491485595703, 44.004295349121094, 45.603675842285156, 47.20305633544922, 48.80243682861328, 50.401817321777344, 52.001197814941406, 53.60057830810547, 55.19995880126953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 8.0, 16.0, 9.0, 14.0, 24.0, 25.0, 34.0, 31.0, 47.0, 42.0, 49.0, 34.0, 46.0, 54.0, 59.0, 41.0, 66.0, 61.0, 36.0, 40.0, 46.0, 34.0, 32.0, 32.0, 18.0, 22.0, 27.0, 19.0, 12.0, 5.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.122802734375, -4.95654296875, -4.790283203125, -4.6240234375, -4.457763671875, -4.29150390625, -4.125244140625, -3.958984375, -3.792724609375, -3.62646484375, -3.460205078125, -3.2939453125, -3.127685546875, -2.96142578125, -2.795166015625, -2.62890625, -2.462646484375, -2.29638671875, -2.130126953125, -1.9638671875, -1.797607421875, -1.63134765625, -1.465087890625, -1.298828125, -1.132568359375, -0.96630859375, -0.800048828125, -0.6337890625, -0.467529296875, -0.30126953125, -0.135009765625, 0.03125, 0.197509765625, 0.36376953125, 0.530029296875, 0.6962890625, 0.862548828125, 1.02880859375, 1.195068359375, 1.361328125, 1.527587890625, 1.69384765625, 1.860107421875, 2.0263671875, 2.192626953125, 2.35888671875, 2.525146484375, 2.69140625, 2.857666015625, 3.02392578125, 3.190185546875, 3.3564453125, 3.522705078125, 3.68896484375, 3.855224609375, 4.021484375, 4.187744140625, 4.35400390625, 4.520263671875, 4.6865234375, 4.852783203125, 5.01904296875, 5.185302734375, 5.3515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 2.0, 3.0, 10.0, 5.0, 13.0, 12.0, 19.0, 25.0, 39.0, 49.0, 52.0, 94.0, 138.0, 298.0, 832.0, 3017.0, 19772.0, 366154.0, 3563850.0, 221603.0, 14459.0, 2437.0, 708.0, 260.0, 143.0, 67.0, 54.0, 48.0, 32.0, 20.0, 21.0, 20.0, 6.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.801025390625, -21.14892578125, -20.496826171875, -19.8447265625, -19.192626953125, -18.54052734375, -17.888427734375, -17.236328125, -16.584228515625, -15.93212890625, -15.280029296875, -14.6279296875, -13.975830078125, -13.32373046875, -12.671630859375, -12.01953125, -11.367431640625, -10.71533203125, -10.063232421875, -9.4111328125, -8.759033203125, -8.10693359375, -7.454833984375, -6.802734375, -6.150634765625, -5.49853515625, -4.846435546875, -4.1943359375, -3.542236328125, -2.89013671875, -2.238037109375, -1.5859375, -0.933837890625, -0.28173828125, 0.370361328125, 1.0224609375, 1.674560546875, 2.32666015625, 2.978759765625, 3.630859375, 4.282958984375, 4.93505859375, 5.587158203125, 6.2392578125, 6.891357421875, 7.54345703125, 8.195556640625, 8.84765625, 9.499755859375, 10.15185546875, 10.803955078125, 11.4560546875, 12.108154296875, 12.76025390625, 13.412353515625, 14.064453125, 14.716552734375, 15.36865234375, 16.020751953125, 16.6728515625, 17.324951171875, 17.97705078125, 18.629150390625, 19.28125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 10.0, 8.0, 11.0, 25.0, 29.0, 51.0, 99.0, 138.0, 198.0, 332.0, 473.0, 606.0, 659.0, 485.0, 361.0, 221.0, 118.0, 98.0, 56.0, 36.0, 26.0, 16.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.44677734375, -16.8466796875, -16.24658203125, -15.646484375, -15.04638671875, -14.4462890625, -13.84619140625, -13.24609375, -12.64599609375, -12.0458984375, -11.44580078125, -10.845703125, -10.24560546875, -9.6455078125, -9.04541015625, -8.4453125, -7.84521484375, -7.2451171875, -6.64501953125, -6.044921875, -5.44482421875, -4.8447265625, -4.24462890625, -3.64453125, -3.04443359375, -2.4443359375, -1.84423828125, -1.244140625, -0.64404296875, -0.0439453125, 0.55615234375, 1.15625, 1.75634765625, 2.3564453125, 2.95654296875, 3.556640625, 4.15673828125, 4.7568359375, 5.35693359375, 5.95703125, 6.55712890625, 7.1572265625, 7.75732421875, 8.357421875, 8.95751953125, 9.5576171875, 10.15771484375, 10.7578125, 11.35791015625, 11.9580078125, 12.55810546875, 13.158203125, 13.75830078125, 14.3583984375, 14.95849609375, 15.55859375, 16.15869140625, 16.7587890625, 17.35888671875, 17.958984375, 18.55908203125, 19.1591796875, 19.75927734375, 20.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 23.0, 22.0, 41.0, 83.0, 120.0, 231.0, 383.0, 985.0, 4300.0, 70229.0, 3707947.0, 396397.0, 10611.0, 1601.0, 596.0, 304.0, 135.0, 84.0, 63.0, 32.0, 34.0, 14.0, 7.0, 8.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.44580078125, -31.0166015625, -29.58740234375, -28.158203125, -26.72900390625, -25.2998046875, -23.87060546875, -22.44140625, -21.01220703125, -19.5830078125, -18.15380859375, -16.724609375, -15.29541015625, -13.8662109375, -12.43701171875, -11.0078125, -9.57861328125, -8.1494140625, -6.72021484375, -5.291015625, -3.86181640625, -2.4326171875, -1.00341796875, 0.42578125, 1.85498046875, 3.2841796875, 4.71337890625, 6.142578125, 7.57177734375, 9.0009765625, 10.43017578125, 11.859375, 13.28857421875, 14.7177734375, 16.14697265625, 17.576171875, 19.00537109375, 20.4345703125, 21.86376953125, 23.29296875, 24.72216796875, 26.1513671875, 27.58056640625, 29.009765625, 30.43896484375, 31.8681640625, 33.29736328125, 34.7265625, 36.15576171875, 37.5849609375, 39.01416015625, 40.443359375, 41.87255859375, 43.3017578125, 44.73095703125, 46.16015625, 47.58935546875, 49.0185546875, 50.44775390625, 51.876953125, 53.30615234375, 54.7353515625, 56.16455078125, 57.59375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 31.0, 232.0, 461.0, 243.0, 42.0, 6.0, 0.0, 1.0], "bins": [-401.98382568359375, -395.11151123046875, -388.2391662597656, -381.3668518066406, -374.4945068359375, -367.6221923828125, -360.7498779296875, -353.8775329589844, -347.0052185058594, -340.1329040527344, -333.26055908203125, -326.38824462890625, -319.5158996582031, -312.6435852050781, -305.771240234375, -298.89892578125, -292.026611328125, -285.154296875, -278.2819519042969, -271.4096374511719, -264.53729248046875, -257.66497802734375, -250.7926483154297, -243.92031860351562, -237.0479736328125, -230.17564392089844, -223.30331420898438, -216.43099975585938, -209.5586700439453, -202.68634033203125, -195.8140106201172, -188.94168090820312, -182.06936645507812, -175.19703674316406, -168.32470703125, -161.452392578125, -154.58006286621094, -147.70773315429688, -140.8354034423828, -133.96307373046875, -127.09074401855469, -120.21841430664062, -113.3460922241211, -106.47376251220703, -99.6014404296875, -92.72911071777344, -85.85678100585938, -78.98445129394531, -72.11212921142578, -65.23979949951172, -58.36747741699219, -51.495147705078125, -44.62282180786133, -37.75049591064453, -30.87816619873047, -24.005840301513672, -17.133514404296875, -10.261187553405762, -3.3888607025146484, 3.4834671020507812, 10.355792999267578, 17.228118896484375, 24.100448608398438, 30.972774505615234, 37.84510040283203]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 6.0, 4.0, 8.0, 10.0, 9.0, 15.0, 4.0, 10.0, 12.0, 9.0, 18.0, 13.0, 26.0, 26.0, 17.0, 26.0, 25.0, 42.0, 28.0, 33.0, 34.0, 16.0, 44.0, 32.0, 25.0, 34.0, 44.0, 33.0, 42.0, 22.0, 36.0, 32.0, 18.0, 25.0, 25.0, 21.0, 22.0, 21.0, 22.0, 12.0, 13.0, 12.0, 6.0, 8.0, 10.0, 13.0, 11.0, 5.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-35.4333381652832, -34.29182434082031, -33.150306701660156, -32.008792877197266, -30.867279052734375, -29.72576332092285, -28.584247589111328, -27.442733764648438, -26.301218032836914, -25.15970230102539, -24.0181884765625, -22.876672744750977, -21.735157012939453, -20.593643188476562, -19.45212745666504, -18.310611724853516, -17.169097900390625, -16.0275821685791, -14.886068344116211, -13.744552612304688, -12.60303783416748, -11.461523056030273, -10.32000732421875, -9.178492546081543, -8.036977767944336, -6.895462989807129, -5.753947734832764, -4.612432479858398, -3.4709177017211914, -2.3294029235839844, -1.1878876686096191, -0.046372413635253906, 1.0951461791992188, 2.236661195755005, 3.378176212310791, 4.519691467285156, 5.661206245422363, 6.80272102355957, 7.9442362785339355, 9.0857515335083, 10.227266311645508, 11.368781089782715, 12.510295867919922, 13.651811599731445, 14.793326377868652, 15.93484115600586, 17.076356887817383, 18.217872619628906, 19.359386444091797, 20.50090217590332, 21.64241600036621, 22.783931732177734, 23.925445556640625, 25.06696128845215, 26.208477020263672, 27.349990844726562, 28.491506576538086, 29.63302230834961, 30.7745361328125, 31.916051864624023, 33.05756759643555, 34.19908142089844, 35.34059524536133, 36.482112884521484, 37.623626708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 8.0, 14.0, 21.0, 29.0, 49.0, 66.0, 86.0, 160.0, 175.0, 274.0, 420.0, 599.0, 855.0, 1381.0, 1958.0, 2964.0, 4537.0, 6884.0, 10491.0, 16619.0, 26619.0, 42629.0, 70017.0, 114301.0, 170342.0, 193117.0, 143829.0, 90858.0, 55500.0, 34051.0, 20778.0, 13464.0, 8534.0, 5580.0, 3717.0, 2494.0, 1644.0, 1079.0, 687.0, 526.0, 397.0, 209.0, 170.0, 130.0, 97.0, 74.0, 29.0, 18.0, 15.0, 30.0, 12.0, 13.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.453369140625, -0.4397392272949219, -0.42610931396484375, -0.4124794006347656, -0.3988494873046875, -0.3852195739746094, -0.37158966064453125, -0.3579597473144531, -0.344329833984375, -0.3306999206542969, -0.31707000732421875, -0.3034400939941406, -0.2898101806640625, -0.2761802673339844, -0.26255035400390625, -0.24892044067382812, -0.23529052734375, -0.22166061401367188, -0.20803070068359375, -0.19440078735351562, -0.1807708740234375, -0.16714096069335938, -0.15351104736328125, -0.13988113403320312, -0.126251220703125, -0.11262130737304688, -0.09899139404296875, -0.08536148071289062, -0.0717315673828125, -0.058101654052734375, -0.04447174072265625, -0.030841827392578125, -0.0172119140625, -0.003582000732421875, 0.01004791259765625, 0.023677825927734375, 0.0373077392578125, 0.050937652587890625, 0.06456756591796875, 0.07819747924804688, 0.091827392578125, 0.10545730590820312, 0.11908721923828125, 0.13271713256835938, 0.1463470458984375, 0.15997695922851562, 0.17360687255859375, 0.18723678588867188, 0.20086669921875, 0.21449661254882812, 0.22812652587890625, 0.24175643920898438, 0.2553863525390625, 0.2690162658691406, 0.28264617919921875, 0.2962760925292969, 0.309906005859375, 0.3235359191894531, 0.33716583251953125, 0.3507957458496094, 0.3644256591796875, 0.3780555725097656, 0.39168548583984375, 0.4053153991699219, 0.4189453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 14.0, 12.0, 16.0, 11.0, 11.0, 24.0, 23.0, 16.0, 25.0, 32.0, 32.0, 25.0, 25.0, 38.0, 40.0, 52.0, 35.0, 1069.0, 34.0, 37.0, 33.0, 34.0, 34.0, 42.0, 34.0, 27.0, 43.0, 30.0, 21.0, 23.0, 10.0, 12.0, 8.0, 11.0, 18.0, 4.0, 4.0, 10.0, 8.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-2.74609375, -2.667266845703125, -2.58843994140625, -2.509613037109375, -2.4307861328125, -2.351959228515625, -2.27313232421875, -2.194305419921875, -2.115478515625, -2.036651611328125, -1.95782470703125, -1.878997802734375, -1.8001708984375, -1.721343994140625, -1.64251708984375, -1.563690185546875, -1.48486328125, -1.406036376953125, -1.32720947265625, -1.248382568359375, -1.1695556640625, -1.090728759765625, -1.01190185546875, -0.933074951171875, -0.854248046875, -0.775421142578125, -0.69659423828125, -0.617767333984375, -0.5389404296875, -0.460113525390625, -0.38128662109375, -0.302459716796875, -0.2236328125, -0.144805908203125, -0.06597900390625, 0.012847900390625, 0.0916748046875, 0.170501708984375, 0.24932861328125, 0.328155517578125, 0.406982421875, 0.485809326171875, 0.56463623046875, 0.643463134765625, 0.7222900390625, 0.801116943359375, 0.87994384765625, 0.958770751953125, 1.03759765625, 1.116424560546875, 1.19525146484375, 1.274078369140625, 1.3529052734375, 1.431732177734375, 1.51055908203125, 1.589385986328125, 1.668212890625, 1.747039794921875, 1.82586669921875, 1.904693603515625, 1.9835205078125, 2.062347412109375, 2.14117431640625, 2.220001220703125, 2.298828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 5.0, 18.0, 30.0, 25.0, 50.0, 90.0, 137.0, 195.0, 330.0, 588.0, 820.0, 1293.0, 2125.0, 3356.0, 4986.0, 8003.0, 12510.0, 19494.0, 30383.0, 46139.0, 70379.0, 102728.0, 138598.0, 1205070.0, 140136.0, 104518.0, 72107.0, 46951.0, 30606.0, 19909.0, 12559.0, 8246.0, 5247.0, 3467.0, 2195.0, 1386.0, 918.0, 541.0, 365.0, 211.0, 146.0, 103.0, 45.0, 35.0, 34.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.332275390625, -0.3226509094238281, -0.31302642822265625, -0.3034019470214844, -0.2937774658203125, -0.2841529846191406, -0.27452850341796875, -0.2649040222167969, -0.255279541015625, -0.24565505981445312, -0.23603057861328125, -0.22640609741210938, -0.2167816162109375, -0.20715713500976562, -0.19753265380859375, -0.18790817260742188, -0.17828369140625, -0.16865921020507812, -0.15903472900390625, -0.14941024780273438, -0.1397857666015625, -0.13016128540039062, -0.12053680419921875, -0.11091232299804688, -0.101287841796875, -0.09166336059570312, -0.08203887939453125, -0.07241439819335938, -0.0627899169921875, -0.053165435791015625, -0.04354095458984375, -0.033916473388671875, -0.0242919921875, -0.014667510986328125, -0.00504302978515625, 0.004581451416015625, 0.0142059326171875, 0.023830413818359375, 0.03345489501953125, 0.043079376220703125, 0.052703857421875, 0.062328338623046875, 0.07195281982421875, 0.08157730102539062, 0.0912017822265625, 0.10082626342773438, 0.11045074462890625, 0.12007522583007812, 0.12969970703125, 0.13932418823242188, 0.14894866943359375, 0.15857315063476562, 0.1681976318359375, 0.17782211303710938, 0.18744659423828125, 0.19707107543945312, 0.206695556640625, 0.21632003784179688, 0.22594451904296875, 0.23556900024414062, 0.2451934814453125, 0.2548179626464844, 0.26444244384765625, 0.2740669250488281, 0.28369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 12.0, 12.0, 19.0, 18.0, 37.0, 41.0, 51.0, 55.0, 81.0, 99.0, 94.0, 81.0, 83.0, 71.0, 52.0, 48.0, 38.0, 18.0, 11.0, 15.0, 13.0, 6.0, 7.0, 4.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00237274169921875, -0.0022725462913513184, -0.0021723508834838867, -0.002072155475616455, -0.0019719600677490234, -0.0018717646598815918, -0.0017715692520141602, -0.0016713738441467285, -0.0015711784362792969, -0.0014709830284118652, -0.0013707876205444336, -0.001270592212677002, -0.0011703968048095703, -0.0010702013969421387, -0.000970005989074707, -0.0008698105812072754, -0.0007696151733398438, -0.0006694197654724121, -0.0005692243576049805, -0.00046902894973754883, -0.0003688335418701172, -0.00026863813400268555, -0.0001684427261352539, -6.824731826782227e-05, 3.1948089599609375e-05, 0.00013214349746704102, 0.00023233890533447266, 0.0003325343132019043, 0.00043272972106933594, 0.0005329251289367676, 0.0006331205368041992, 0.0007333159446716309, 0.0008335113525390625, 0.0009337067604064941, 0.0010339021682739258, 0.0011340975761413574, 0.001234292984008789, 0.0013344883918762207, 0.0014346837997436523, 0.001534879207611084, 0.0016350746154785156, 0.0017352700233459473, 0.001835465431213379, 0.0019356608390808105, 0.002035856246948242, 0.002136051654815674, 0.0022362470626831055, 0.002336442470550537, 0.0024366378784179688, 0.0025368332862854004, 0.002637028694152832, 0.0027372241020202637, 0.0028374195098876953, 0.002937614917755127, 0.0030378103256225586, 0.0031380057334899902, 0.003238201141357422, 0.0033383965492248535, 0.003438591957092285, 0.003538787364959717, 0.0036389827728271484, 0.00373917818069458, 0.0038393735885620117, 0.003939568996429443, 0.004039764404296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 6.0, 14.0, 35.0, 41.0, 34.0, 72.0, 101.0, 141.0, 260.0, 411.0, 1099.0, 904138.0, 140365.0, 791.0, 351.0, 246.0, 132.0, 88.0, 43.0, 45.0, 44.0, 20.0, 11.0, 11.0, 10.0, 7.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.08294677734375, -0.08091878890991211, -0.07889080047607422, -0.07686281204223633, -0.07483482360839844, -0.07280683517456055, -0.07077884674072266, -0.06875085830688477, -0.06672286987304688, -0.06469488143920898, -0.0626668930053711, -0.0606389045715332, -0.05861091613769531, -0.05658292770385742, -0.05455493927001953, -0.05252695083618164, -0.05049896240234375, -0.04847097396850586, -0.04644298553466797, -0.04441499710083008, -0.04238700866699219, -0.0403590202331543, -0.038331031799316406, -0.036303043365478516, -0.034275054931640625, -0.032247066497802734, -0.030219078063964844, -0.028191089630126953, -0.026163101196289062, -0.024135112762451172, -0.02210712432861328, -0.02007913589477539, -0.0180511474609375, -0.01602315902709961, -0.013995170593261719, -0.011967182159423828, -0.009939193725585938, -0.007911205291748047, -0.005883216857910156, -0.0038552284240722656, -0.001827239990234375, 0.00020074844360351562, 0.0022287368774414062, 0.004256725311279297, 0.0062847137451171875, 0.008312702178955078, 0.010340690612792969, 0.01236867904663086, 0.01439666748046875, 0.01642465591430664, 0.01845264434814453, 0.020480632781982422, 0.022508621215820312, 0.024536609649658203, 0.026564598083496094, 0.028592586517333984, 0.030620574951171875, 0.032648563385009766, 0.034676551818847656, 0.03670454025268555, 0.03873252868652344, 0.04076051712036133, 0.04278850555419922, 0.04481649398803711, 0.046844482421875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1008.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051476843655109406, -0.05020083114504814, -0.04892481863498688, -0.04764880612492561, -0.04637279361486435, -0.04509677737951279, -0.04382076486945152, -0.04254475235939026, -0.041268739849328995, -0.03999272733926773, -0.03871671482920647, -0.0374407023191452, -0.03616468608379364, -0.034888673573732376, -0.03361266106367111, -0.03233664855360985, -0.031060636043548584, -0.02978462353348732, -0.028508611023426056, -0.027232596650719643, -0.02595658414065838, -0.024680571630597115, -0.0234045572578907, -0.022128544747829437, -0.020852532237768173, -0.01957651972770691, -0.018300507217645645, -0.017024492844939232, -0.015748480334877968, -0.014472467824816704, -0.013196454383432865, -0.011920440942049026, -0.010644424706697464, -0.0093684121966362, -0.008092398755252361, -0.00681638577952981, -0.005540372803807259, -0.004264359828084707, -0.002988346852362156, -0.0017123334109783173, -0.0004363209009170532, 0.0008396920748054981, 0.0021157050505280495, 0.003391718026250601, 0.004667731001973152, 0.0059437439776957035, 0.007219756953418255, 0.008495770394802094, 0.009771782904863358, 0.011047795414924622, 0.01232380885630846, 0.013599822297692299, 0.014875834807753563, 0.016151847317814827, 0.01742786169052124, 0.018703874200582504, 0.01997988671064377, 0.021255899220705032, 0.022531911730766296, 0.02380792610347271, 0.025083938613533974, 0.026359951123595238, 0.02763596549630165, 0.028911978006362915, 0.03018799051642418]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 8.0, 12.0, 15.0, 20.0, 19.0, 32.0, 25.0, 44.0, 45.0, 57.0, 55.0, 51.0, 64.0, 71.0, 76.0, 81.0, 66.0, 52.0, 45.0, 36.0, 24.0, 30.0, 17.0, 29.0, 15.0, 7.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015898346900939941, -0.0015199529007077217, -0.0014500711113214493, -0.0013801893219351768, -0.0013103075325489044, -0.001240425743162632, -0.0011705439537763596, -0.0011006621643900871, -0.0010307803750038147, -0.0009608985856175423, -0.0008910167962312698, -0.0008211350068449974, -0.000751253217458725, -0.0006813714280724525, -0.0006114896386861801, -0.0005416078492999077, -0.00047172605991363525, -0.0004018442705273628, -0.0003319624811410904, -0.00026208069175481796, -0.00019219890236854553, -0.0001223171129822731, -5.243532359600067e-05, 1.744646579027176e-05, 8.732825517654419e-05, 0.00015721004456281662, 0.00022709183394908905, 0.0002969736233353615, 0.0003668554127216339, 0.00043673720210790634, 0.0005066189914941788, 0.0005765007808804512, 0.0006463825702667236, 0.0007162643596529961, 0.0007861461490392685, 0.0008560279384255409, 0.0009259097278118134, 0.0009957915171980858, 0.0010656733065843582, 0.0011355550959706306, 0.001205436885356903, 0.0012753186747431755, 0.001345200464129448, 0.0014150822535157204, 0.0014849640429019928, 0.0015548458322882652, 0.0016247276216745377, 0.00169460941106081, 0.0017644912004470825, 0.001834372989833355, 0.0019042547792196274, 0.0019741365686059, 0.0020440183579921722, 0.0021139001473784447, 0.002183781936764717, 0.0022536637261509895, 0.002323545515537262, 0.0023934273049235344, 0.002463309094309807, 0.0025331908836960793, 0.0026030726730823517, 0.002672954462468624, 0.0027428362518548965, 0.002812718041241169, 0.0028825998306274414]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 21.0, 37.0, 43.0, 63.0, 109.0, 177.0, 330.0, 525.0, 966.0, 1787.0, 3128.0, 5823.0, 12117.0, 28929.0, 91019.0, 440442.0, 341067.0, 74438.0, 25067.0, 10568.0, 5298.0, 2769.0, 1603.0, 942.0, 530.0, 313.0, 179.0, 99.0, 57.0, 37.0, 20.0, 14.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-4.94140625, -4.817626953125, -4.69384765625, -4.570068359375, -4.4462890625, -4.322509765625, -4.19873046875, -4.074951171875, -3.951171875, -3.827392578125, -3.70361328125, -3.579833984375, -3.4560546875, -3.332275390625, -3.20849609375, -3.084716796875, -2.9609375, -2.837158203125, -2.71337890625, -2.589599609375, -2.4658203125, -2.342041015625, -2.21826171875, -2.094482421875, -1.970703125, -1.846923828125, -1.72314453125, -1.599365234375, -1.4755859375, -1.351806640625, -1.22802734375, -1.104248046875, -0.98046875, -0.856689453125, -0.73291015625, -0.609130859375, -0.4853515625, -0.361572265625, -0.23779296875, -0.114013671875, 0.009765625, 0.133544921875, 0.25732421875, 0.381103515625, 0.5048828125, 0.628662109375, 0.75244140625, 0.876220703125, 1.0, 1.123779296875, 1.24755859375, 1.371337890625, 1.4951171875, 1.618896484375, 1.74267578125, 1.866455078125, 1.990234375, 2.114013671875, 2.23779296875, 2.361572265625, 2.4853515625, 2.609130859375, 2.73291015625, 2.856689453125, 2.98046875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 7.0, 14.0, 13.0, 14.0, 16.0, 24.0, 25.0, 28.0, 43.0, 43.0, 44.0, 52.0, 61.0, 71.0, 306.0, 1725.0, 105.0, 57.0, 46.0, 48.0, 43.0, 39.0, 26.0, 29.0, 33.0, 30.0, 20.0, 20.0, 10.0, 15.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.58740234375, -16.0185546875, -15.44970703125, -14.880859375, -14.31201171875, -13.7431640625, -13.17431640625, -12.60546875, -12.03662109375, -11.4677734375, -10.89892578125, -10.330078125, -9.76123046875, -9.1923828125, -8.62353515625, -8.0546875, -7.48583984375, -6.9169921875, -6.34814453125, -5.779296875, -5.21044921875, -4.6416015625, -4.07275390625, -3.50390625, -2.93505859375, -2.3662109375, -1.79736328125, -1.228515625, -0.65966796875, -0.0908203125, 0.47802734375, 1.046875, 1.61572265625, 2.1845703125, 2.75341796875, 3.322265625, 3.89111328125, 4.4599609375, 5.02880859375, 5.59765625, 6.16650390625, 6.7353515625, 7.30419921875, 7.873046875, 8.44189453125, 9.0107421875, 9.57958984375, 10.1484375, 10.71728515625, 11.2861328125, 11.85498046875, 12.423828125, 12.99267578125, 13.5615234375, 14.13037109375, 14.69921875, 15.26806640625, 15.8369140625, 16.40576171875, 16.974609375, 17.54345703125, 18.1123046875, 18.68115234375, 19.25]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 11.0, 14.0, 22.0, 29.0, 29.0, 38.0, 40.0, 48.0, 72.0, 118.0, 176.0, 372.0, 1234.0, 11390.0, 2969667.0, 157545.0, 3473.0, 667.0, 269.0, 133.0, 73.0, 65.0, 40.0, 39.0, 29.0, 15.0, 14.0, 11.0, 16.0, 13.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.20458984375, -30.2529296875, -29.30126953125, -28.349609375, -27.39794921875, -26.4462890625, -25.49462890625, -24.54296875, -23.59130859375, -22.6396484375, -21.68798828125, -20.736328125, -19.78466796875, -18.8330078125, -17.88134765625, -16.9296875, -15.97802734375, -15.0263671875, -14.07470703125, -13.123046875, -12.17138671875, -11.2197265625, -10.26806640625, -9.31640625, -8.36474609375, -7.4130859375, -6.46142578125, -5.509765625, -4.55810546875, -3.6064453125, -2.65478515625, -1.703125, -0.75146484375, 0.2001953125, 1.15185546875, 2.103515625, 3.05517578125, 4.0068359375, 4.95849609375, 5.91015625, 6.86181640625, 7.8134765625, 8.76513671875, 9.716796875, 10.66845703125, 11.6201171875, 12.57177734375, 13.5234375, 14.47509765625, 15.4267578125, 16.37841796875, 17.330078125, 18.28173828125, 19.2333984375, 20.18505859375, 21.13671875, 22.08837890625, 23.0400390625, 23.99169921875, 24.943359375, 25.89501953125, 26.8466796875, 27.79833984375, 28.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [18.0, 218.0, 684.0, 92.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.627401351928711, -4.445851802825928, -1.2643022537231445, 1.9172477722167969, 5.098796844482422, 8.280345916748047, 11.461896896362305, 14.64344596862793, 17.824995040893555, 21.00654411315918, 24.188095092773438, 27.369644165039062, 30.551193237304688, 33.73274230957031, 36.91429138183594, 40.09584045410156, 43.27738952636719, 46.45893859863281, 49.64048767089844, 52.82203674316406, 56.00358581542969, 59.18513488769531, 62.3666877746582, 65.54823303222656, 68.72978973388672, 71.91133880615234, 75.09288787841797, 78.2744369506836, 81.45598602294922, 84.63753509521484, 87.819091796875, 91.00064086914062, 94.18218994140625, 97.36373901367188, 100.5452880859375, 103.72683715820312, 106.90838623046875, 110.08993530273438, 113.271484375, 116.45303344726562, 119.63458251953125, 122.81613159179688, 125.9976806640625, 129.17922973632812, 132.36077880859375, 135.54232788085938, 138.723876953125, 141.90542602539062, 145.08697509765625, 148.26852416992188, 151.4500732421875, 154.63162231445312, 157.81317138671875, 160.99472045898438, 164.17626953125, 167.35781860351562, 170.5393829345703, 173.72093200683594, 176.90248107910156, 180.0840301513672, 183.2655792236328, 186.44712829589844, 189.62867736816406, 192.8102264404297, 195.9917755126953]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 10.0, 5.0, 12.0, 9.0, 12.0, 20.0, 18.0, 22.0, 23.0, 18.0, 18.0, 20.0, 27.0, 27.0, 36.0, 34.0, 39.0, 38.0, 46.0, 31.0, 35.0, 45.0, 39.0, 46.0, 38.0, 36.0, 33.0, 26.0, 40.0, 24.0, 21.0, 19.0, 22.0, 17.0, 13.0, 20.0, 20.0, 13.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.74734115600586, -49.18922424316406, -47.631107330322266, -46.07299041748047, -44.51487350463867, -42.956756591796875, -41.39863967895508, -39.84052276611328, -38.282405853271484, -36.72428894042969, -35.16617202758789, -33.608055114746094, -32.0499382019043, -30.4918212890625, -28.933704376220703, -27.375587463378906, -25.817468643188477, -24.25935173034668, -22.701234817504883, -21.143117904663086, -19.58500099182129, -18.026884078979492, -16.468765258789062, -14.910649299621582, -13.352532386779785, -11.794415473937988, -10.236298561096191, -8.678180694580078, -7.1200642585754395, -5.561947345733643, -4.0038299560546875, -2.4457130432128906, -0.8875961303710938, 0.6705209016799927, 2.228637933731079, 3.786755084991455, 5.344871997833252, 6.902988910675049, 8.461106300354004, 10.0192232131958, 11.577340126037598, 13.135457038879395, 14.693573951721191, 16.251691818237305, 17.8098087310791, 19.3679256439209, 20.926042556762695, 22.484159469604492, 24.04227638244629, 25.600393295288086, 27.158510208129883, 28.71662712097168, 30.274744033813477, 31.832860946655273, 33.3909797668457, 34.9490966796875, 36.5072135925293, 38.065330505371094, 39.62344741821289, 41.18156433105469, 42.739681243896484, 44.29779815673828, 45.85591506958008, 47.414031982421875, 48.97214889526367]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 4.0, 11.0, 14.0, 17.0, 17.0, 23.0, 28.0, 22.0, 27.0, 35.0, 39.0, 40.0, 30.0, 52.0, 42.0, 49.0, 48.0, 44.0, 38.0, 52.0, 35.0, 47.0, 30.0, 33.0, 24.0, 40.0, 26.0, 24.0, 12.0, 10.0, 15.0, 14.0, 7.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.17340087890625, -4.0264892578125, -3.87957763671875, -3.732666015625, -3.58575439453125, -3.4388427734375, -3.29193115234375, -3.14501953125, -2.99810791015625, -2.8511962890625, -2.70428466796875, -2.557373046875, -2.41046142578125, -2.2635498046875, -2.11663818359375, -1.9697265625, -1.82281494140625, -1.6759033203125, -1.52899169921875, -1.382080078125, -1.23516845703125, -1.0882568359375, -0.94134521484375, -0.79443359375, -0.64752197265625, -0.5006103515625, -0.35369873046875, -0.206787109375, -0.05987548828125, 0.0870361328125, 0.23394775390625, 0.380859375, 0.52777099609375, 0.6746826171875, 0.82159423828125, 0.968505859375, 1.11541748046875, 1.2623291015625, 1.40924072265625, 1.55615234375, 1.70306396484375, 1.8499755859375, 1.99688720703125, 2.143798828125, 2.29071044921875, 2.4376220703125, 2.58453369140625, 2.7314453125, 2.87835693359375, 3.0252685546875, 3.17218017578125, 3.319091796875, 3.46600341796875, 3.6129150390625, 3.75982666015625, 3.90673828125, 4.05364990234375, 4.2005615234375, 4.34747314453125, 4.494384765625, 4.64129638671875, 4.7882080078125, 4.93511962890625, 5.08203125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 7.0, 10.0, 15.0, 8.0, 26.0, 19.0, 28.0, 28.0, 43.0, 42.0, 55.0, 91.0, 212.0, 1000.0, 8653.0, 242223.0, 3808525.0, 126582.0, 5577.0, 649.0, 141.0, 75.0, 43.0, 40.0, 31.0, 24.0, 25.0, 24.0, 17.0, 17.0, 6.0, 10.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.80322265625, -22.9658203125, -22.12841796875, -21.291015625, -20.45361328125, -19.6162109375, -18.77880859375, -17.94140625, -17.10400390625, -16.2666015625, -15.42919921875, -14.591796875, -13.75439453125, -12.9169921875, -12.07958984375, -11.2421875, -10.40478515625, -9.5673828125, -8.72998046875, -7.892578125, -7.05517578125, -6.2177734375, -5.38037109375, -4.54296875, -3.70556640625, -2.8681640625, -2.03076171875, -1.193359375, -0.35595703125, 0.4814453125, 1.31884765625, 2.15625, 2.99365234375, 3.8310546875, 4.66845703125, 5.505859375, 6.34326171875, 7.1806640625, 8.01806640625, 8.85546875, 9.69287109375, 10.5302734375, 11.36767578125, 12.205078125, 13.04248046875, 13.8798828125, 14.71728515625, 15.5546875, 16.39208984375, 17.2294921875, 18.06689453125, 18.904296875, 19.74169921875, 20.5791015625, 21.41650390625, 22.25390625, 23.09130859375, 23.9287109375, 24.76611328125, 25.603515625, 26.44091796875, 27.2783203125, 28.11572265625, 28.953125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 8.0, 22.0, 45.0, 66.0, 83.0, 116.0, 202.0, 207.0, 329.0, 476.0, 573.0, 552.0, 447.0, 304.0, 210.0, 144.0, 86.0, 57.0, 40.0, 23.0, 15.0, 14.0, 10.0, 5.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.802001953125, -20.29150390625, -19.781005859375, -19.2705078125, -18.760009765625, -18.24951171875, -17.739013671875, -17.228515625, -16.718017578125, -16.20751953125, -15.697021484375, -15.1865234375, -14.676025390625, -14.16552734375, -13.655029296875, -13.14453125, -12.634033203125, -12.12353515625, -11.613037109375, -11.1025390625, -10.592041015625, -10.08154296875, -9.571044921875, -9.060546875, -8.550048828125, -8.03955078125, -7.529052734375, -7.0185546875, -6.508056640625, -5.99755859375, -5.487060546875, -4.9765625, -4.466064453125, -3.95556640625, -3.445068359375, -2.9345703125, -2.424072265625, -1.91357421875, -1.403076171875, -0.892578125, -0.382080078125, 0.12841796875, 0.638916015625, 1.1494140625, 1.659912109375, 2.17041015625, 2.680908203125, 3.19140625, 3.701904296875, 4.21240234375, 4.722900390625, 5.2333984375, 5.743896484375, 6.25439453125, 6.764892578125, 7.275390625, 7.785888671875, 8.29638671875, 8.806884765625, 9.3173828125, 9.827880859375, 10.33837890625, 10.848876953125, 11.359375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 7.0, 0.0, 16.0, 9.0, 27.0, 39.0, 70.0, 88.0, 183.0, 359.0, 1026.0, 10520.0, 1109813.0, 3051089.0, 18770.0, 1358.0, 392.0, 197.0, 133.0, 68.0, 44.0, 37.0, 16.0, 14.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.296875, -23.501220703125, -21.70556640625, -19.909912109375, -18.1142578125, -16.318603515625, -14.52294921875, -12.727294921875, -10.931640625, -9.135986328125, -7.34033203125, -5.544677734375, -3.7490234375, -1.953369140625, -0.15771484375, 1.637939453125, 3.43359375, 5.229248046875, 7.02490234375, 8.820556640625, 10.6162109375, 12.411865234375, 14.20751953125, 16.003173828125, 17.798828125, 19.594482421875, 21.39013671875, 23.185791015625, 24.9814453125, 26.777099609375, 28.57275390625, 30.368408203125, 32.1640625, 33.959716796875, 35.75537109375, 37.551025390625, 39.3466796875, 41.142333984375, 42.93798828125, 44.733642578125, 46.529296875, 48.324951171875, 50.12060546875, 51.916259765625, 53.7119140625, 55.507568359375, 57.30322265625, 59.098876953125, 60.89453125, 62.690185546875, 64.48583984375, 66.281494140625, 68.0771484375, 69.872802734375, 71.66845703125, 73.464111328125, 75.259765625, 77.055419921875, 78.85107421875, 80.646728515625, 82.4423828125, 84.238037109375, 86.03369140625, 87.829345703125, 89.625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 15.0, 48.0, 80.0, 145.0, 229.0, 213.0, 149.0, 61.0, 36.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.05523681640625, -156.84902954101562, -153.642822265625, -150.4365997314453, -147.2303924560547, -144.02418518066406, -140.81796264648438, -137.61175537109375, -134.40554809570312, -131.1993408203125, -127.99312591552734, -124.78691101074219, -121.58070373535156, -118.37449645996094, -115.16828155517578, -111.96206665039062, -108.755859375, -105.54965209960938, -102.34343719482422, -99.13722229003906, -95.93101501464844, -92.72480773925781, -89.51859283447266, -86.3123779296875, -83.10617065429688, -79.89996337890625, -76.6937484741211, -73.48753356933594, -70.28132629394531, -67.07511901855469, -63.86890411376953, -60.66269302368164, -57.45648956298828, -54.25027847290039, -51.0440673828125, -47.83785629272461, -44.63164520263672, -41.42543411254883, -38.21922302246094, -35.01301193237305, -31.806800842285156, -28.600589752197266, -25.394378662109375, -22.188167572021484, -18.981956481933594, -15.775745391845703, -12.569534301757812, -9.363323211669922, -6.157112121582031, -2.9509010314941406, 0.25531005859375, 3.4615211486816406, 6.667732238769531, 9.873943328857422, 13.080154418945312, 16.286365509033203, 19.492576599121094, 22.698787689208984, 25.904998779296875, 29.111209869384766, 32.317420959472656, 35.52363204956055, 38.72984313964844, 41.93605422973633, 45.14226531982422]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 14.0, 18.0, 18.0, 32.0, 26.0, 16.0, 44.0, 25.0, 35.0, 34.0, 32.0, 34.0, 38.0, 44.0, 44.0, 37.0, 29.0, 38.0, 42.0, 39.0, 34.0, 19.0, 35.0, 29.0, 33.0, 20.0, 28.0, 20.0, 23.0, 6.0, 12.0, 10.0, 12.0, 15.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.816436767578125, -41.521385192871094, -40.22633743286133, -38.9312858581543, -37.63623809814453, -36.3411865234375, -35.04613494873047, -33.75108337402344, -32.45603561401367, -31.160985946655273, -29.865936279296875, -28.570884704589844, -27.275835037231445, -25.980785369873047, -24.685733795166016, -23.390684127807617, -22.09563446044922, -20.80058479309082, -19.505535125732422, -18.21048355102539, -16.915433883666992, -15.620384216308594, -14.325333595275879, -13.030282974243164, -11.735233306884766, -10.440183639526367, -9.145133018493652, -7.850082874298096, -6.555032730102539, -5.259982585906982, -3.964932441711426, -2.669881820678711, -1.3748321533203125, -0.07978200912475586, 1.2152681350708008, 2.5103182792663574, 3.805368423461914, 5.100418567657471, 6.395468711853027, 7.690519332885742, 8.98556900024414, 10.280618667602539, 11.575669288635254, 12.870719909667969, 14.165769577026367, 15.460819244384766, 16.755870819091797, 18.050920486450195, 19.345970153808594, 20.641019821166992, 21.93606948852539, 23.231121063232422, 24.52617073059082, 25.82122039794922, 27.11627197265625, 28.41132164001465, 29.706371307373047, 31.001420974731445, 32.296470642089844, 33.591522216796875, 34.886573791503906, 36.18162155151367, 37.4766731262207, 38.77172088623047, 40.0667724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 4.0, 21.0, 29.0, 53.0, 53.0, 72.0, 130.0, 175.0, 252.0, 346.0, 519.0, 815.0, 1139.0, 1628.0, 2554.0, 3779.0, 5670.0, 8623.0, 13245.0, 20505.0, 32040.0, 50265.0, 80100.0, 123032.0, 169697.0, 172929.0, 127988.0, 84170.0, 52745.0, 33635.0, 21554.0, 13888.0, 8875.0, 5919.0, 3922.0, 2610.0, 1747.0, 1201.0, 825.0, 558.0, 375.0, 286.0, 170.0, 138.0, 88.0, 63.0, 40.0, 24.0, 16.0, 12.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.419677734375, -0.4061622619628906, -0.39264678955078125, -0.3791313171386719, -0.3656158447265625, -0.3521003723144531, -0.33858489990234375, -0.3250694274902344, -0.311553955078125, -0.2980384826660156, -0.28452301025390625, -0.2710075378417969, -0.2574920654296875, -0.24397659301757812, -0.23046112060546875, -0.21694564819335938, -0.20343017578125, -0.18991470336914062, -0.17639923095703125, -0.16288375854492188, -0.1493682861328125, -0.13585281372070312, -0.12233734130859375, -0.10882186889648438, -0.095306396484375, -0.08179092407226562, -0.06827545166015625, -0.054759979248046875, -0.0412445068359375, -0.027729034423828125, -0.01421356201171875, -0.000698089599609375, 0.0128173828125, 0.026332855224609375, 0.03984832763671875, 0.053363800048828125, 0.0668792724609375, 0.08039474487304688, 0.09391021728515625, 0.10742568969726562, 0.120941162109375, 0.13445663452148438, 0.14797210693359375, 0.16148757934570312, 0.1750030517578125, 0.18851852416992188, 0.20203399658203125, 0.21554946899414062, 0.22906494140625, 0.24258041381835938, 0.25609588623046875, 0.2696113586425781, 0.2831268310546875, 0.2966423034667969, 0.31015777587890625, 0.3236732482910156, 0.337188720703125, 0.3507041931152344, 0.36421966552734375, 0.3777351379394531, 0.3912506103515625, 0.4047660827636719, 0.41828155517578125, 0.4317970275878906, 0.4453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 13.0, 15.0, 13.0, 22.0, 18.0, 21.0, 26.0, 32.0, 33.0, 33.0, 38.0, 29.0, 35.0, 47.0, 38.0, 47.0, 1063.0, 39.0, 45.0, 38.0, 33.0, 37.0, 44.0, 39.0, 31.0, 25.0, 20.0, 23.0, 19.0, 17.0, 10.0, 16.0, 8.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.59228515625, -2.5009765625, -2.40966796875, -2.318359375, -2.22705078125, -2.1357421875, -2.04443359375, -1.953125, -1.86181640625, -1.7705078125, -1.67919921875, -1.587890625, -1.49658203125, -1.4052734375, -1.31396484375, -1.22265625, -1.13134765625, -1.0400390625, -0.94873046875, -0.857421875, -0.76611328125, -0.6748046875, -0.58349609375, -0.4921875, -0.40087890625, -0.3095703125, -0.21826171875, -0.126953125, -0.03564453125, 0.0556640625, 0.14697265625, 0.23828125, 0.32958984375, 0.4208984375, 0.51220703125, 0.603515625, 0.69482421875, 0.7861328125, 0.87744140625, 0.96875, 1.06005859375, 1.1513671875, 1.24267578125, 1.333984375, 1.42529296875, 1.5166015625, 1.60791015625, 1.69921875, 1.79052734375, 1.8818359375, 1.97314453125, 2.064453125, 2.15576171875, 2.2470703125, 2.33837890625, 2.4296875, 2.52099609375, 2.6123046875, 2.70361328125, 2.794921875, 2.88623046875, 2.9775390625, 3.06884765625, 3.16015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 10.0, 11.0, 16.0, 32.0, 60.0, 93.0, 149.0, 220.0, 444.0, 741.0, 1259.0, 2210.0, 3875.0, 6876.0, 11823.0, 20662.0, 35539.0, 60717.0, 100157.0, 152237.0, 1236607.0, 170079.0, 118305.0, 72792.0, 42961.0, 25182.0, 14531.0, 8331.0, 4729.0, 2736.0, 1624.0, 896.0, 495.0, 324.0, 160.0, 113.0, 58.0, 30.0, 18.0, 13.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.430908203125, -0.41883087158203125, -0.4067535400390625, -0.39467620849609375, -0.382598876953125, -0.37052154541015625, -0.3584442138671875, -0.34636688232421875, -0.33428955078125, -0.32221221923828125, -0.3101348876953125, -0.29805755615234375, -0.285980224609375, -0.27390289306640625, -0.2618255615234375, -0.24974822998046875, -0.2376708984375, -0.22559356689453125, -0.2135162353515625, -0.20143890380859375, -0.189361572265625, -0.17728424072265625, -0.1652069091796875, -0.15312957763671875, -0.14105224609375, -0.12897491455078125, -0.1168975830078125, -0.10482025146484375, -0.092742919921875, -0.08066558837890625, -0.0685882568359375, -0.05651092529296875, -0.04443359375, -0.03235626220703125, -0.0202789306640625, -0.00820159912109375, 0.003875732421875, 0.01595306396484375, 0.0280303955078125, 0.04010772705078125, 0.05218505859375, 0.06426239013671875, 0.0763397216796875, 0.08841705322265625, 0.100494384765625, 0.11257171630859375, 0.1246490478515625, 0.13672637939453125, 0.1488037109375, 0.16088104248046875, 0.1729583740234375, 0.18503570556640625, 0.197113037109375, 0.20919036865234375, 0.2212677001953125, 0.23334503173828125, 0.24542236328125, 0.25749969482421875, 0.2695770263671875, 0.28165435791015625, 0.293731689453125, 0.30580902099609375, 0.3178863525390625, 0.32996368408203125, 0.342041015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 5.0, 10.0, 14.0, 17.0, 10.0, 18.0, 16.0, 14.0, 23.0, 41.0, 48.0, 51.0, 56.0, 58.0, 69.0, 67.0, 66.0, 72.0, 67.0, 43.0, 46.0, 41.0, 35.0, 20.0, 22.0, 15.0, 8.0, 14.0, 6.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411285400390625, -0.0035358965396881104, -0.003430664539337158, -0.003325432538986206, -0.003220200538635254, -0.0031149685382843018, -0.0030097365379333496, -0.0029045045375823975, -0.0027992725372314453, -0.002694040536880493, -0.002588808536529541, -0.002483576536178589, -0.0023783445358276367, -0.0022731125354766846, -0.0021678805351257324, -0.0020626485347747803, -0.001957416534423828, -0.001852184534072876, -0.0017469525337219238, -0.0016417205333709717, -0.0015364885330200195, -0.0014312565326690674, -0.0013260245323181152, -0.001220792531967163, -0.001115560531616211, -0.0010103285312652588, -0.0009050965309143066, -0.0007998645305633545, -0.0006946325302124023, -0.0005894005298614502, -0.00048416852951049805, -0.0003789365291595459, -0.00027370452880859375, -0.0001684725284576416, -6.324052810668945e-05, 4.1991472244262695e-05, 0.00014722347259521484, 0.000252455472946167, 0.00035768747329711914, 0.0004629194736480713, 0.0005681514739990234, 0.0006733834743499756, 0.0007786154747009277, 0.0008838474750518799, 0.000989079475402832, 0.0010943114757537842, 0.0011995434761047363, 0.0013047754764556885, 0.0014100074768066406, 0.0015152394771575928, 0.001620471477508545, 0.001725703477859497, 0.0018309354782104492, 0.0019361674785614014, 0.0020413994789123535, 0.0021466314792633057, 0.002251863479614258, 0.00235709547996521, 0.002462327480316162, 0.0025675594806671143, 0.0026727914810180664, 0.0027780234813690186, 0.0028832554817199707, 0.002988487482070923, 0.003093719482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 18.0, 30.0, 39.0, 44.0, 57.0, 71.0, 81.0, 84.0, 143.0, 204.0, 391.0, 770.0, 17784.0, 1021439.0, 5634.0, 619.0, 292.0, 227.0, 152.0, 103.0, 81.0, 55.0, 49.0, 36.0, 21.0, 25.0, 9.0, 14.0, 10.0, 4.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058502197265625, -0.05663871765136719, -0.054775238037109375, -0.05291175842285156, -0.05104827880859375, -0.04918479919433594, -0.047321319580078125, -0.04545783996582031, -0.0435943603515625, -0.04173088073730469, -0.039867401123046875, -0.03800392150878906, -0.03614044189453125, -0.03427696228027344, -0.032413482666015625, -0.030550003051757812, -0.0286865234375, -0.026823043823242188, -0.024959564208984375, -0.023096084594726562, -0.02123260498046875, -0.019369125366210938, -0.017505645751953125, -0.015642166137695312, -0.0137786865234375, -0.011915206909179688, -0.010051727294921875, -0.008188247680664062, -0.00632476806640625, -0.0044612884521484375, -0.002597808837890625, -0.0007343292236328125, 0.001129150390625, 0.0029926300048828125, 0.004856109619140625, 0.0067195892333984375, 0.00858306884765625, 0.010446548461914062, 0.012310028076171875, 0.014173507690429688, 0.0160369873046875, 0.017900466918945312, 0.019763946533203125, 0.021627426147460938, 0.02349090576171875, 0.025354385375976562, 0.027217864990234375, 0.029081344604492188, 0.03094482421875, 0.03280830383300781, 0.034671783447265625, 0.03653526306152344, 0.03839874267578125, 0.04026222229003906, 0.042125701904296875, 0.04398918151855469, 0.0458526611328125, 0.04771614074707031, 0.049579620361328125, 0.05144309997558594, 0.05330657958984375, 0.05517005920410156, 0.057033538818359375, 0.05889701843261719, 0.060760498046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1005.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037998151034116745, -0.036793846637010574, -0.035589538514614105, -0.034385234117507935, -0.033180929720401764, -0.03197662532329559, -0.030772319063544273, -0.029568012803792953, -0.028363708406686783, -0.027159404009580612, -0.025955097749829292, -0.024750791490077972, -0.023546487092971802, -0.02234218269586563, -0.02113787643611431, -0.01993357017636299, -0.01872926577925682, -0.01752496138215065, -0.01632065512239933, -0.015116349793970585, -0.01391204446554184, -0.012707739137113094, -0.011503433808684349, -0.010299128480255604, -0.009094823151826859, -0.007890517823398113, -0.006686212494969368, -0.005481907166540623, -0.0042776018381118774, -0.003073296509683132, -0.001868991181254387, -0.0006646858528256416, 0.0005396232008934021, 0.0017439285293221474, 0.0029482338577508926, 0.004152539186179638, 0.005356844514608383, 0.0065611498430371284, 0.007765455171465874, 0.008969760499894619, 0.010174065828323364, 0.01137837115675211, 0.012582676485180855, 0.0137869818136096, 0.014991287142038345, 0.016195591539144516, 0.017399897798895836, 0.018604204058647156, 0.019808508455753326, 0.021012812852859497, 0.022217119112610817, 0.023421425372362137, 0.024625729769468307, 0.025830034166574478, 0.027034340426325798, 0.028238646686077118, 0.02944295108318329, 0.03064725548028946, 0.03185155987739563, 0.0330558679997921, 0.03426017239689827, 0.03546447679400444, 0.03666878491640091, 0.03787308931350708, 0.03907739371061325]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 7.0, 14.0, 18.0, 12.0, 32.0, 23.0, 26.0, 32.0, 35.0, 51.0, 58.0, 44.0, 44.0, 62.0, 52.0, 52.0, 63.0, 47.0, 64.0, 41.0, 39.0, 32.0, 22.0, 22.0, 28.0, 16.0, 21.0, 4.0, 13.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018758773803710938, -0.001799331046640873, -0.0017227847129106522, -0.0016462383791804314, -0.0015696920454502106, -0.0014931457117199898, -0.001416599377989769, -0.0013400530442595482, -0.0012635067105293274, -0.0011869603767991066, -0.0011104140430688858, -0.001033867709338665, -0.0009573213756084442, -0.0008807750418782234, -0.0008042287081480026, -0.0007276823744177818, -0.000651136040687561, -0.0005745897069573402, -0.0004980433732271194, -0.00042149703949689865, -0.00034495070576667786, -0.00026840437203645706, -0.00019185803830623627, -0.00011531170457601547, -3.876537084579468e-05, 3.778096288442612e-05, 0.00011432729661464691, 0.0001908736303448677, 0.0002674199640750885, 0.0003439662978053093, 0.0004205126315355301, 0.0004970589652657509, 0.0005736052989959717, 0.0006501516327261925, 0.0007266979664564133, 0.0008032443001866341, 0.0008797906339168549, 0.0009563369676470757, 0.0010328833013772964, 0.0011094296351075172, 0.001185975968837738, 0.0012625223025679588, 0.0013390686362981796, 0.0014156149700284004, 0.0014921613037586212, 0.001568707637488842, 0.0016452539712190628, 0.0017218003049492836, 0.0017983466386795044, 0.0018748929724097252, 0.001951439306139946, 0.0020279856398701668, 0.0021045319736003876, 0.0021810783073306084, 0.002257624641060829, 0.00233417097479105, 0.0024107173085212708, 0.0024872636422514915, 0.0025638099759817123, 0.002640356309711933, 0.002716902643442154, 0.0027934489771723747, 0.0028699953109025955, 0.0029465416446328163, 0.003023087978363037]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 19.0, 26.0, 21.0, 42.0, 72.0, 92.0, 119.0, 163.0, 315.0, 436.0, 793.0, 1325.0, 2596.0, 5159.0, 10176.0, 23638.0, 66454.0, 252070.0, 480102.0, 133026.0, 40169.0, 15739.0, 7454.0, 3741.0, 1938.0, 1057.0, 622.0, 398.0, 244.0, 136.0, 115.0, 91.0, 53.0, 36.0, 31.0, 20.0, 18.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.390625, -3.288726806640625, -3.18682861328125, -3.084930419921875, -2.9830322265625, -2.881134033203125, -2.77923583984375, -2.677337646484375, -2.575439453125, -2.473541259765625, -2.37164306640625, -2.269744873046875, -2.1678466796875, -2.065948486328125, -1.96405029296875, -1.862152099609375, -1.76025390625, -1.658355712890625, -1.55645751953125, -1.454559326171875, -1.3526611328125, -1.250762939453125, -1.14886474609375, -1.046966552734375, -0.945068359375, -0.843170166015625, -0.74127197265625, -0.639373779296875, -0.5374755859375, -0.435577392578125, -0.33367919921875, -0.231781005859375, -0.1298828125, -0.027984619140625, 0.07391357421875, 0.175811767578125, 0.2777099609375, 0.379608154296875, 0.48150634765625, 0.583404541015625, 0.685302734375, 0.787200927734375, 0.88909912109375, 0.990997314453125, 1.0928955078125, 1.194793701171875, 1.29669189453125, 1.398590087890625, 1.50048828125, 1.602386474609375, 1.70428466796875, 1.806182861328125, 1.9080810546875, 2.009979248046875, 2.11187744140625, 2.213775634765625, 2.315673828125, 2.417572021484375, 2.51947021484375, 2.621368408203125, 2.7232666015625, 2.825164794921875, 2.92706298828125, 3.028961181640625, 3.130859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 6.0, 19.0, 17.0, 16.0, 24.0, 23.0, 25.0, 37.0, 28.0, 32.0, 45.0, 46.0, 44.0, 64.0, 77.0, 1697.0, 313.0, 75.0, 62.0, 50.0, 53.0, 49.0, 37.0, 33.0, 29.0, 26.0, 22.0, 22.0, 12.0, 15.0, 10.0, 10.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.34375, -17.8177490234375, -17.291748046875, -16.7657470703125, -16.23974609375, -15.7137451171875, -15.187744140625, -14.6617431640625, -14.1357421875, -13.6097412109375, -13.083740234375, -12.5577392578125, -12.03173828125, -11.5057373046875, -10.979736328125, -10.4537353515625, -9.927734375, -9.4017333984375, -8.875732421875, -8.3497314453125, -7.82373046875, -7.2977294921875, -6.771728515625, -6.2457275390625, -5.7197265625, -5.1937255859375, -4.667724609375, -4.1417236328125, -3.61572265625, -3.0897216796875, -2.563720703125, -2.0377197265625, -1.51171875, -0.9857177734375, -0.459716796875, 0.0662841796875, 0.59228515625, 1.1182861328125, 1.644287109375, 2.1702880859375, 2.6962890625, 3.2222900390625, 3.748291015625, 4.2742919921875, 4.80029296875, 5.3262939453125, 5.852294921875, 6.3782958984375, 6.904296875, 7.4302978515625, 7.956298828125, 8.4822998046875, 9.00830078125, 9.5343017578125, 10.060302734375, 10.5863037109375, 11.1123046875, 11.6383056640625, 12.164306640625, 12.6903076171875, 13.21630859375, 13.7423095703125, 14.268310546875, 14.7943115234375, 15.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 12.0, 13.0, 8.0, 5.0, 15.0, 25.0, 18.0, 29.0, 36.0, 33.0, 52.0, 95.0, 114.0, 191.0, 376.0, 934.0, 3434.0, 76101.0, 3043765.0, 16947.0, 2014.0, 640.0, 267.0, 156.0, 111.0, 56.0, 41.0, 50.0, 24.0, 26.0, 24.0, 20.0, 18.0, 13.0, 13.0, 2.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.914306640625, -23.12548828125, -22.336669921875, -21.5478515625, -20.759033203125, -19.97021484375, -19.181396484375, -18.392578125, -17.603759765625, -16.81494140625, -16.026123046875, -15.2373046875, -14.448486328125, -13.65966796875, -12.870849609375, -12.08203125, -11.293212890625, -10.50439453125, -9.715576171875, -8.9267578125, -8.137939453125, -7.34912109375, -6.560302734375, -5.771484375, -4.982666015625, -4.19384765625, -3.405029296875, -2.6162109375, -1.827392578125, -1.03857421875, -0.249755859375, 0.5390625, 1.327880859375, 2.11669921875, 2.905517578125, 3.6943359375, 4.483154296875, 5.27197265625, 6.060791015625, 6.849609375, 7.638427734375, 8.42724609375, 9.216064453125, 10.0048828125, 10.793701171875, 11.58251953125, 12.371337890625, 13.16015625, 13.948974609375, 14.73779296875, 15.526611328125, 16.3154296875, 17.104248046875, 17.89306640625, 18.681884765625, 19.470703125, 20.259521484375, 21.04833984375, 21.837158203125, 22.6259765625, 23.414794921875, 24.20361328125, 24.992431640625, 25.78125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 126.0, 715.0, 159.0, 8.0], "bins": [-174.2695770263672, -171.43614196777344, -168.60269165039062, -165.76925659179688, -162.93580627441406, -160.1023712158203, -157.2689208984375, -154.43548583984375, -151.60205078125, -148.76861572265625, -145.93516540527344, -143.1017303466797, -140.26828002929688, -137.43484497070312, -134.60140991210938, -131.76795959472656, -128.93450927734375, -126.10106658935547, -123.26762390136719, -120.43418884277344, -117.60074615478516, -114.76730346679688, -111.9338607788086, -109.10041809082031, -106.26698303222656, -103.43354034423828, -100.60009765625, -97.76666259765625, -94.93321990966797, -92.09977722167969, -89.2663345336914, -86.43289184570312, -83.59944915771484, -80.76600646972656, -77.93256378173828, -75.09912109375, -72.26568603515625, -69.43224334716797, -66.59880065917969, -63.765357971191406, -60.93191909790039, -58.09847640991211, -55.265037536621094, -52.43159484863281, -49.59815216064453, -46.76470947265625, -43.931270599365234, -41.09782791137695, -38.26438903808594, -35.430946350097656, -32.59750747680664, -29.76406478881836, -26.930622100830078, -24.09718132019043, -21.26374053955078, -18.4302978515625, -15.596856117248535, -12.76341438293457, -9.929973602294922, -7.096531867980957, -4.263090133666992, -1.4296483993530273, 1.403792381286621, 4.237235069274902, 7.070675849914551]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 12.0, 22.0, 20.0, 26.0, 17.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 28.0, 27.0, 38.0, 31.0, 40.0, 31.0, 46.0, 38.0, 40.0, 33.0, 33.0, 34.0, 25.0, 32.0, 20.0, 19.0, 19.0, 20.0, 21.0, 17.0, 12.0, 20.0, 19.0, 11.0, 10.0, 11.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-44.84918212890625, -43.43840789794922, -42.02763748168945, -40.61686325073242, -39.206092834472656, -37.795318603515625, -36.384544372558594, -34.97377014160156, -33.5629997253418, -32.152225494384766, -30.741455078125, -29.33068084716797, -27.91990852355957, -26.509136199951172, -25.09836196899414, -23.687589645385742, -22.276817321777344, -20.866044998168945, -19.455272674560547, -18.044498443603516, -16.633726119995117, -15.222953796386719, -13.812180519104004, -12.401407241821289, -10.99063491821289, -9.579862594604492, -8.169089317321777, -6.758316516876221, -5.347543716430664, -3.9367709159851074, -2.525998115539551, -1.115224838256836, 0.2955513000488281, 1.7063241004943848, 3.1170969009399414, 4.527869701385498, 5.938642501831055, 7.349415302276611, 8.760188102722168, 10.170961380004883, 11.581733703613281, 12.99250602722168, 14.403279304504395, 15.81405258178711, 17.224824905395508, 18.635597229003906, 20.046371459960938, 21.457143783569336, 22.867916107177734, 24.278688430786133, 25.68946075439453, 27.100234985351562, 28.51100730895996, 29.92177963256836, 31.33255386352539, 32.743324279785156, 34.15409851074219, 35.56487274169922, 36.975643157958984, 38.386417388916016, 39.79718780517578, 41.20796203613281, 42.618736267089844, 44.029510498046875, 45.44028091430664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 13.0, 10.0, 7.0, 17.0, 19.0, 12.0, 22.0, 32.0, 21.0, 36.0, 42.0, 31.0, 35.0, 40.0, 45.0, 41.0, 34.0, 47.0, 44.0, 43.0, 44.0, 44.0, 33.0, 36.0, 26.0, 33.0, 26.0, 24.0, 18.0, 9.0, 18.0, 18.0, 16.0, 10.0, 11.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48858642578125, -4.3404541015625, -4.19232177734375, -4.044189453125, -3.89605712890625, -3.7479248046875, -3.59979248046875, -3.45166015625, -3.30352783203125, -3.1553955078125, -3.00726318359375, -2.859130859375, -2.71099853515625, -2.5628662109375, -2.41473388671875, -2.2666015625, -2.11846923828125, -1.9703369140625, -1.82220458984375, -1.674072265625, -1.52593994140625, -1.3778076171875, -1.22967529296875, -1.08154296875, -0.93341064453125, -0.7852783203125, -0.63714599609375, -0.489013671875, -0.34088134765625, -0.1927490234375, -0.04461669921875, 0.103515625, 0.25164794921875, 0.3997802734375, 0.54791259765625, 0.696044921875, 0.84417724609375, 0.9923095703125, 1.14044189453125, 1.28857421875, 1.43670654296875, 1.5848388671875, 1.73297119140625, 1.881103515625, 2.02923583984375, 2.1773681640625, 2.32550048828125, 2.4736328125, 2.62176513671875, 2.7698974609375, 2.91802978515625, 3.066162109375, 3.21429443359375, 3.3624267578125, 3.51055908203125, 3.65869140625, 3.80682373046875, 3.9549560546875, 4.10308837890625, 4.251220703125, 4.39935302734375, 4.5474853515625, 4.69561767578125, 4.84375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 6.0, 10.0, 17.0, 25.0, 28.0, 36.0, 45.0, 82.0, 131.0, 204.0, 382.0, 822.0, 1605.0, 3658.0, 9587.0, 28481.0, 109746.0, 721311.0, 2282006.0, 857762.0, 129653.0, 31958.0, 9862.0, 3672.0, 1545.0, 717.0, 363.0, 170.0, 111.0, 68.0, 41.0, 34.0, 21.0, 21.0, 19.0, 15.0, 12.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3104248046875, -8.019287109375, -7.7281494140625, -7.43701171875, -7.1458740234375, -6.854736328125, -6.5635986328125, -6.2724609375, -5.9813232421875, -5.690185546875, -5.3990478515625, -5.10791015625, -4.8167724609375, -4.525634765625, -4.2344970703125, -3.943359375, -3.6522216796875, -3.361083984375, -3.0699462890625, -2.77880859375, -2.4876708984375, -2.196533203125, -1.9053955078125, -1.6142578125, -1.3231201171875, -1.031982421875, -0.7408447265625, -0.44970703125, -0.1585693359375, 0.132568359375, 0.4237060546875, 0.71484375, 1.0059814453125, 1.297119140625, 1.5882568359375, 1.87939453125, 2.1705322265625, 2.461669921875, 2.7528076171875, 3.0439453125, 3.3350830078125, 3.626220703125, 3.9173583984375, 4.20849609375, 4.4996337890625, 4.790771484375, 5.0819091796875, 5.373046875, 5.6641845703125, 5.955322265625, 6.2464599609375, 6.53759765625, 6.8287353515625, 7.119873046875, 7.4110107421875, 7.7021484375, 7.9932861328125, 8.284423828125, 8.5755615234375, 8.86669921875, 9.1578369140625, 9.448974609375, 9.7401123046875, 10.03125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 21.0, 22.0, 41.0, 60.0, 55.0, 107.0, 141.0, 205.0, 328.0, 422.0, 543.0, 616.0, 461.0, 325.0, 235.0, 164.0, 102.0, 71.0, 48.0, 29.0, 21.0, 13.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.607666015625, -16.10595703125, -15.604248046875, -15.1025390625, -14.600830078125, -14.09912109375, -13.597412109375, -13.095703125, -12.593994140625, -12.09228515625, -11.590576171875, -11.0888671875, -10.587158203125, -10.08544921875, -9.583740234375, -9.08203125, -8.580322265625, -8.07861328125, -7.576904296875, -7.0751953125, -6.573486328125, -6.07177734375, -5.570068359375, -5.068359375, -4.566650390625, -4.06494140625, -3.563232421875, -3.0615234375, -2.559814453125, -2.05810546875, -1.556396484375, -1.0546875, -0.552978515625, -0.05126953125, 0.450439453125, 0.9521484375, 1.453857421875, 1.95556640625, 2.457275390625, 2.958984375, 3.460693359375, 3.96240234375, 4.464111328125, 4.9658203125, 5.467529296875, 5.96923828125, 6.470947265625, 6.97265625, 7.474365234375, 7.97607421875, 8.477783203125, 8.9794921875, 9.481201171875, 9.98291015625, 10.484619140625, 10.986328125, 11.488037109375, 11.98974609375, 12.491455078125, 12.9931640625, 13.494873046875, 13.99658203125, 14.498291015625, 15.0]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 2.0, 1.0, 7.0, 11.0, 15.0, 9.0, 18.0, 20.0, 25.0, 37.0, 43.0, 82.0, 88.0, 101.0, 194.0, 339.0, 556.0, 1379.0, 5073.0, 35135.0, 580777.0, 3369238.0, 179804.0, 16087.0, 2990.0, 920.0, 431.0, 251.0, 180.0, 113.0, 88.0, 53.0, 48.0, 28.0, 34.0, 22.0, 12.0, 11.0, 11.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-29.046875, -28.119384765625, -27.19189453125, -26.264404296875, -25.3369140625, -24.409423828125, -23.48193359375, -22.554443359375, -21.626953125, -20.699462890625, -19.77197265625, -18.844482421875, -17.9169921875, -16.989501953125, -16.06201171875, -15.134521484375, -14.20703125, -13.279541015625, -12.35205078125, -11.424560546875, -10.4970703125, -9.569580078125, -8.64208984375, -7.714599609375, -6.787109375, -5.859619140625, -4.93212890625, -4.004638671875, -3.0771484375, -2.149658203125, -1.22216796875, -0.294677734375, 0.6328125, 1.560302734375, 2.48779296875, 3.415283203125, 4.3427734375, 5.270263671875, 6.19775390625, 7.125244140625, 8.052734375, 8.980224609375, 9.90771484375, 10.835205078125, 11.7626953125, 12.690185546875, 13.61767578125, 14.545166015625, 15.47265625, 16.400146484375, 17.32763671875, 18.255126953125, 19.1826171875, 20.110107421875, 21.03759765625, 21.965087890625, 22.892578125, 23.820068359375, 24.74755859375, 25.675048828125, 26.6025390625, 27.530029296875, 28.45751953125, 29.385009765625, 30.3125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 24.0, 32.0, 69.0, 100.0, 124.0, 140.0, 155.0, 119.0, 108.0, 62.0, 26.0, 14.0, 12.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.81227111816406, -74.55052185058594, -72.28877258300781, -70.02702331542969, -67.76527404785156, -65.50352478027344, -63.24177932739258, -60.98003005981445, -58.71828079223633, -56.4565315246582, -54.19478225708008, -51.93303298950195, -49.671287536621094, -47.40953826904297, -45.147789001464844, -42.88603973388672, -40.624290466308594, -38.36254119873047, -36.100791931152344, -33.83904266357422, -31.577295303344727, -29.3155460357666, -27.05379867553711, -24.792049407958984, -22.53030014038086, -20.268550872802734, -18.00680160522461, -15.745054244995117, -13.483304977416992, -11.221555709838867, -8.959807395935059, -6.69805908203125, -4.436309814453125, -2.174561023712158, 0.0871877670288086, 2.3489365577697754, 4.610685348510742, 6.872434616088867, 9.134182929992676, 11.395931243896484, 13.65768051147461, 15.919429779052734, 18.18117904663086, 20.44292640686035, 22.704675674438477, 24.9664249420166, 27.228172302246094, 29.48992156982422, 31.751670837402344, 34.01342010498047, 36.275169372558594, 38.53691864013672, 40.798667907714844, 43.06041717529297, 45.32216262817383, 47.58391189575195, 49.84566116333008, 52.1074104309082, 54.36915969848633, 56.63090896606445, 58.89265441894531, 61.15440368652344, 63.41615295410156, 65.67790222167969, 67.93965148925781]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 8.0, 16.0, 13.0, 26.0, 20.0, 22.0, 30.0, 35.0, 34.0, 33.0, 37.0, 39.0, 37.0, 38.0, 51.0, 39.0, 46.0, 42.0, 57.0, 53.0, 44.0, 28.0, 42.0, 32.0, 32.0, 19.0, 20.0, 13.0, 19.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.31919860839844, -41.86086654663086, -40.402530670166016, -38.94419860839844, -37.485862731933594, -36.027530670166016, -34.56919860839844, -33.110862731933594, -31.652528762817383, -30.194194793701172, -28.73586082458496, -27.27752685546875, -25.819194793701172, -24.360858917236328, -22.90252685546875, -21.44419288635254, -19.985858917236328, -18.527524948120117, -17.069190979003906, -15.610857963562012, -14.1525239944458, -12.69419002532959, -11.235857009887695, -9.777523040771484, -8.319189071655273, -6.8608551025390625, -5.40252161026001, -3.944188117980957, -2.485854148864746, -1.0275201797485352, 0.4308128356933594, 1.8891468048095703, 3.3474807739257812, 4.805814743041992, 6.264148235321045, 7.722481727600098, 9.180815696716309, 10.63914966583252, 12.097482681274414, 13.555816650390625, 15.014150619506836, 16.472484588623047, 17.930818557739258, 19.38915252685547, 20.847484588623047, 22.30582046508789, 23.76415252685547, 25.22248649597168, 26.68082046508789, 28.1391544342041, 29.597488403320312, 31.05582046508789, 32.514156341552734, 33.97248840332031, 35.430824279785156, 36.889156341552734, 38.34748840332031, 39.80582046508789, 41.264156341552734, 42.72248840332031, 44.180824279785156, 45.639156341552734, 47.09748840332031, 48.555824279785156, 50.01416015625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 3.0, 16.0, 18.0, 8.0, 31.0, 34.0, 51.0, 74.0, 88.0, 124.0, 180.0, 267.0, 400.0, 568.0, 803.0, 1150.0, 1713.0, 2478.0, 3857.0, 5902.0, 9038.0, 13980.0, 22122.0, 34545.0, 55387.0, 87665.0, 132525.0, 173248.0, 165699.0, 120940.0, 78440.0, 49300.0, 31134.0, 19910.0, 12512.0, 8047.0, 5270.0, 3525.0, 2342.0, 1578.0, 1068.0, 762.0, 512.0, 346.0, 260.0, 187.0, 137.0, 89.0, 56.0, 47.0, 38.0, 28.0, 21.0, 9.0, 11.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44341278076171875, -0.4285736083984375, -0.41373443603515625, -0.398895263671875, -0.38405609130859375, -0.3692169189453125, -0.35437774658203125, -0.33953857421875, -0.32469940185546875, -0.3098602294921875, -0.29502105712890625, -0.280181884765625, -0.26534271240234375, -0.2505035400390625, -0.23566436767578125, -0.2208251953125, -0.20598602294921875, -0.1911468505859375, -0.17630767822265625, -0.161468505859375, -0.14662933349609375, -0.1317901611328125, -0.11695098876953125, -0.10211181640625, -0.08727264404296875, -0.0724334716796875, -0.05759429931640625, -0.042755126953125, -0.02791595458984375, -0.0130767822265625, 0.00176239013671875, 0.0166015625, 0.03144073486328125, 0.0462799072265625, 0.06111907958984375, 0.075958251953125, 0.09079742431640625, 0.1056365966796875, 0.12047576904296875, 0.13531494140625, 0.15015411376953125, 0.1649932861328125, 0.17983245849609375, 0.194671630859375, 0.20951080322265625, 0.2243499755859375, 0.23918914794921875, 0.2540283203125, 0.26886749267578125, 0.2837066650390625, 0.29854583740234375, 0.313385009765625, 0.32822418212890625, 0.3430633544921875, 0.35790252685546875, 0.37274169921875, 0.38758087158203125, 0.4024200439453125, 0.41725921630859375, 0.432098388671875, 0.44693756103515625, 0.4617767333984375, 0.47661590576171875, 0.491455078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 10.0, 5.0, 6.0, 7.0, 12.0, 15.0, 20.0, 24.0, 31.0, 26.0, 32.0, 37.0, 42.0, 45.0, 39.0, 56.0, 48.0, 1065.0, 51.0, 63.0, 57.0, 55.0, 41.0, 39.0, 30.0, 25.0, 36.0, 29.0, 29.0, 18.0, 13.0, 15.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.923858642578125, -3.80084228515625, -3.677825927734375, -3.5548095703125, -3.431793212890625, -3.30877685546875, -3.185760498046875, -3.062744140625, -2.939727783203125, -2.81671142578125, -2.693695068359375, -2.5706787109375, -2.447662353515625, -2.32464599609375, -2.201629638671875, -2.07861328125, -1.955596923828125, -1.83258056640625, -1.709564208984375, -1.5865478515625, -1.463531494140625, -1.34051513671875, -1.217498779296875, -1.094482421875, -0.971466064453125, -0.84844970703125, -0.725433349609375, -0.6024169921875, -0.479400634765625, -0.35638427734375, -0.233367919921875, -0.1103515625, 0.012664794921875, 0.13568115234375, 0.258697509765625, 0.3817138671875, 0.504730224609375, 0.62774658203125, 0.750762939453125, 0.873779296875, 0.996795654296875, 1.11981201171875, 1.242828369140625, 1.3658447265625, 1.488861083984375, 1.61187744140625, 1.734893798828125, 1.85791015625, 1.980926513671875, 2.10394287109375, 2.226959228515625, 2.3499755859375, 2.472991943359375, 2.59600830078125, 2.719024658203125, 2.842041015625, 2.965057373046875, 3.08807373046875, 3.211090087890625, 3.3341064453125, 3.457122802734375, 3.58013916015625, 3.703155517578125, 3.826171875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 17.0, 25.0, 32.0, 47.0, 114.0, 174.0, 258.0, 438.0, 731.0, 1217.0, 2052.0, 3395.0, 5520.0, 9215.0, 15369.0, 25379.0, 42081.0, 68286.0, 107979.0, 155898.0, 1228516.0, 153608.0, 105608.0, 66709.0, 41099.0, 24865.0, 15166.0, 9175.0, 5618.0, 3322.0, 2081.0, 1217.0, 730.0, 478.0, 242.0, 199.0, 102.0, 55.0, 30.0, 18.0, 15.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.368408203125, -0.3563232421875, -0.34423828125, -0.3321533203125, -0.320068359375, -0.3079833984375, -0.2958984375, -0.2838134765625, -0.271728515625, -0.2596435546875, -0.24755859375, -0.2354736328125, -0.223388671875, -0.2113037109375, -0.19921875, -0.1871337890625, -0.175048828125, -0.1629638671875, -0.15087890625, -0.1387939453125, -0.126708984375, -0.1146240234375, -0.1025390625, -0.0904541015625, -0.078369140625, -0.0662841796875, -0.05419921875, -0.0421142578125, -0.030029296875, -0.0179443359375, -0.005859375, 0.0062255859375, 0.018310546875, 0.0303955078125, 0.04248046875, 0.0545654296875, 0.066650390625, 0.0787353515625, 0.0908203125, 0.1029052734375, 0.114990234375, 0.1270751953125, 0.13916015625, 0.1512451171875, 0.163330078125, 0.1754150390625, 0.1875, 0.1995849609375, 0.211669921875, 0.2237548828125, 0.23583984375, 0.2479248046875, 0.260009765625, 0.2720947265625, 0.2841796875, 0.2962646484375, 0.308349609375, 0.3204345703125, 0.33251953125, 0.3446044921875, 0.356689453125, 0.3687744140625, 0.380859375, 0.3929443359375, 0.405029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 11.0, 14.0, 18.0, 21.0, 21.0, 24.0, 34.0, 53.0, 57.0, 59.0, 69.0, 67.0, 56.0, 73.0, 51.0, 50.0, 63.0, 41.0, 32.0, 22.0, 31.0, 20.0, 19.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0033111572265625, -0.003223031759262085, -0.00313490629196167, -0.003046780824661255, -0.00295865535736084, -0.002870529890060425, -0.0027824044227600098, -0.0026942789554595947, -0.0026061534881591797, -0.0025180280208587646, -0.0024299025535583496, -0.0023417770862579346, -0.0022536516189575195, -0.0021655261516571045, -0.0020774006843566895, -0.0019892752170562744, -0.0019011497497558594, -0.0018130242824554443, -0.0017248988151550293, -0.0016367733478546143, -0.0015486478805541992, -0.0014605224132537842, -0.0013723969459533691, -0.001284271478652954, -0.001196146011352539, -0.001108020544052124, -0.001019895076751709, -0.0009317696094512939, -0.0008436441421508789, -0.0007555186748504639, -0.0006673932075500488, -0.0005792677402496338, -0.0004911422729492188, -0.0004030168056488037, -0.00031489133834838867, -0.00022676587104797363, -0.0001386404037475586, -5.0514936447143555e-05, 3.7610530853271484e-05, 0.00012573599815368652, 0.00021386146545410156, 0.0003019869327545166, 0.00039011240005493164, 0.0004782378673553467, 0.0005663633346557617, 0.0006544888019561768, 0.0007426142692565918, 0.0008307397365570068, 0.0009188652038574219, 0.001006990671157837, 0.001095116138458252, 0.001183241605758667, 0.001271367073059082, 0.001359492540359497, 0.0014476180076599121, 0.0015357434749603271, 0.0016238689422607422, 0.0017119944095611572, 0.0018001198768615723, 0.0018882453441619873, 0.0019763708114624023, 0.0020644962787628174, 0.0021526217460632324, 0.0022407472133636475, 0.0023288726806640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 13.0, 10.0, 11.0, 11.0, 19.0, 25.0, 42.0, 55.0, 78.0, 99.0, 123.0, 202.0, 283.0, 535.0, 3627.0, 953122.0, 87945.0, 1095.0, 403.0, 239.0, 148.0, 121.0, 100.0, 57.0, 49.0, 44.0, 22.0, 19.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047515869140625, -0.04574155807495117, -0.043967247009277344, -0.042192935943603516, -0.04041862487792969, -0.03864431381225586, -0.03687000274658203, -0.0350956916809082, -0.033321380615234375, -0.03154706954956055, -0.02977275848388672, -0.02799844741821289, -0.026224136352539062, -0.024449825286865234, -0.022675514221191406, -0.020901203155517578, -0.01912689208984375, -0.017352581024169922, -0.015578269958496094, -0.013803958892822266, -0.012029647827148438, -0.01025533676147461, -0.008481025695800781, -0.006706714630126953, -0.004932403564453125, -0.003158092498779297, -0.0013837814331054688, 0.0003905296325683594, 0.0021648406982421875, 0.003939151763916016, 0.005713462829589844, 0.007487773895263672, 0.0092620849609375, 0.011036396026611328, 0.012810707092285156, 0.014585018157958984, 0.016359329223632812, 0.01813364028930664, 0.01990795135498047, 0.021682262420654297, 0.023456573486328125, 0.025230884552001953, 0.02700519561767578, 0.02877950668334961, 0.030553817749023438, 0.032328128814697266, 0.034102439880371094, 0.03587675094604492, 0.03765106201171875, 0.03942537307739258, 0.041199684143066406, 0.042973995208740234, 0.04474830627441406, 0.04652261734008789, 0.04829692840576172, 0.05007123947143555, 0.051845550537109375, 0.0536198616027832, 0.05539417266845703, 0.05716848373413086, 0.05894279479980469, 0.060717105865478516, 0.062491416931152344, 0.06426572799682617, 0.0660400390625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 443.0, 531.0, 31.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016857799142599106, -0.016347317025065422, -0.015836836770176888, -0.015326354652643204, -0.014815873466432095, -0.014305392280220985, -0.013794910162687302, -0.013284428976476192, -0.012773947790265083, -0.012263466604053974, -0.011752985417842865, -0.011242503300309181, -0.010732022114098072, -0.010221540927886963, -0.009711058810353279, -0.00920057762414217, -0.00869009643793106, -0.008179615251719952, -0.007669133599847555, -0.007158651947975159, -0.0066481707617640495, -0.00613768957555294, -0.005627207923680544, -0.005116726271808147, -0.004606245085597038, -0.004095763899385929, -0.0035852822475135326, -0.00307480082847178, -0.002564319409430027, -0.002053837990388274, -0.0015433565713465214, -0.0010328751523047686, -0.000522395595908165, -1.1914176866412163e-05, 0.0004985672421753407, 0.0010090486612170935, 0.0015195300802588463, 0.002030011499300599, 0.002540492918342352, 0.0030509743373841047, 0.0035614557564258575, 0.004071936942636967, 0.004582418594509363, 0.00509290024638176, 0.005603381432592869, 0.006113862618803978, 0.0066243442706763744, 0.007134825922548771, 0.00764530710875988, 0.00815578829497099, 0.008666269481182098, 0.009176751598715782, 0.009687232784926891, 0.010197713971138, 0.010708196088671684, 0.011218677274882793, 0.011729158461093903, 0.012239639647305012, 0.012750120833516121, 0.013260602951049805, 0.013771084137260914, 0.014281565323472023, 0.014792047441005707, 0.015302528627216816, 0.015813009813427925]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 5.0, 8.0, 9.0, 10.0, 22.0, 25.0, 13.0, 20.0, 24.0, 26.0, 32.0, 23.0, 37.0, 31.0, 33.0, 31.0, 24.0, 36.0, 45.0, 52.0, 47.0, 45.0, 34.0, 36.0, 28.0, 42.0, 23.0, 31.0, 24.0, 20.0, 29.0, 12.0, 17.0, 14.0, 10.0, 17.0, 13.0, 13.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013415217399597168, -0.0012950357049703598, -0.0012485496699810028, -0.0012020636349916458, -0.0011555776000022888, -0.0011090915650129318, -0.0010626055300235748, -0.0010161194950342178, -0.0009696334600448608, -0.0009231474250555038, -0.0008766613900661469, -0.0008301753550767899, -0.0007836893200874329, -0.0007372032850980759, -0.0006907172501087189, -0.0006442312151193619, -0.0005977451801300049, -0.0005512591451406479, -0.0005047731101512909, -0.0004582870751619339, -0.0004118010401725769, -0.0003653150051832199, -0.0003188289701938629, -0.0002723429352045059, -0.00022585690021514893, -0.00017937086522579193, -0.00013288483023643494, -8.639879524707794e-05, -3.991276025772095e-05, 6.573274731636047e-06, 5.305930972099304e-05, 9.954534471035004e-05, 0.00014603137969970703, 0.00019251741468906403, 0.00023900344967842102, 0.000285489484667778, 0.000331975519657135, 0.000378461554646492, 0.000424947589635849, 0.000471433624625206, 0.000517919659614563, 0.00056440569460392, 0.000610891729593277, 0.000657377764582634, 0.000703863799571991, 0.000750349834561348, 0.000796835869550705, 0.000843321904540062, 0.0008898079395294189, 0.0009362939745187759, 0.000982780009508133, 0.00102926604449749, 0.001075752079486847, 0.001122238114476204, 0.001168724149465561, 0.001215210184454918, 0.001261696219444275, 0.001308182254433632, 0.001354668289422989, 0.0014011543244123459, 0.0014476403594017029, 0.0014941263943910599, 0.0015406124293804169, 0.0015870984643697739, 0.0016335844993591309]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 16.0, 12.0, 17.0, 33.0, 47.0, 64.0, 100.0, 127.0, 189.0, 265.0, 413.0, 626.0, 964.0, 1428.0, 2303.0, 4158.0, 8233.0, 19779.0, 63299.0, 265849.0, 489946.0, 129315.0, 34752.0, 12404.0, 5773.0, 3169.0, 1792.0, 1121.0, 749.0, 535.0, 315.0, 231.0, 159.0, 110.0, 75.0, 46.0, 42.0, 25.0, 15.0, 17.0, 6.0, 4.0, 4.0, 8.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0390625, -3.913848876953125, -3.78863525390625, -3.663421630859375, -3.5382080078125, -3.412994384765625, -3.28778076171875, -3.162567138671875, -3.037353515625, -2.912139892578125, -2.78692626953125, -2.661712646484375, -2.5364990234375, -2.411285400390625, -2.28607177734375, -2.160858154296875, -2.03564453125, -1.910430908203125, -1.78521728515625, -1.660003662109375, -1.5347900390625, -1.409576416015625, -1.28436279296875, -1.159149169921875, -1.033935546875, -0.908721923828125, -0.78350830078125, -0.658294677734375, -0.5330810546875, -0.407867431640625, -0.28265380859375, -0.157440185546875, -0.0322265625, 0.092987060546875, 0.21820068359375, 0.343414306640625, 0.4686279296875, 0.593841552734375, 0.71905517578125, 0.844268798828125, 0.969482421875, 1.094696044921875, 1.21990966796875, 1.345123291015625, 1.4703369140625, 1.595550537109375, 1.72076416015625, 1.845977783203125, 1.97119140625, 2.096405029296875, 2.22161865234375, 2.346832275390625, 2.4720458984375, 2.597259521484375, 2.72247314453125, 2.847686767578125, 2.972900390625, 3.098114013671875, 3.22332763671875, 3.348541259765625, 3.4737548828125, 3.598968505859375, 3.72418212890625, 3.849395751953125, 3.974609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 1.0, 4.0, 8.0, 12.0, 9.0, 9.0, 15.0, 16.0, 26.0, 24.0, 26.0, 34.0, 31.0, 51.0, 54.0, 49.0, 62.0, 113.0, 1731.0, 276.0, 77.0, 55.0, 49.0, 48.0, 39.0, 37.0, 37.0, 21.0, 29.0, 27.0, 17.0, 11.0, 12.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.25244140625, -15.6455078125, -15.03857421875, -14.431640625, -13.82470703125, -13.2177734375, -12.61083984375, -12.00390625, -11.39697265625, -10.7900390625, -10.18310546875, -9.576171875, -8.96923828125, -8.3623046875, -7.75537109375, -7.1484375, -6.54150390625, -5.9345703125, -5.32763671875, -4.720703125, -4.11376953125, -3.5068359375, -2.89990234375, -2.29296875, -1.68603515625, -1.0791015625, -0.47216796875, 0.134765625, 0.74169921875, 1.3486328125, 1.95556640625, 2.5625, 3.16943359375, 3.7763671875, 4.38330078125, 4.990234375, 5.59716796875, 6.2041015625, 6.81103515625, 7.41796875, 8.02490234375, 8.6318359375, 9.23876953125, 9.845703125, 10.45263671875, 11.0595703125, 11.66650390625, 12.2734375, 12.88037109375, 13.4873046875, 14.09423828125, 14.701171875, 15.30810546875, 15.9150390625, 16.52197265625, 17.12890625, 17.73583984375, 18.3427734375, 18.94970703125, 19.556640625, 20.16357421875, 20.7705078125, 21.37744140625, 21.984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 13.0, 4.0, 3.0, 14.0, 12.0, 11.0, 19.0, 24.0, 31.0, 42.0, 49.0, 69.0, 76.0, 126.0, 218.0, 460.0, 1378.0, 18918.0, 3061004.0, 59624.0, 2330.0, 491.0, 243.0, 153.0, 97.0, 72.0, 51.0, 42.0, 26.0, 23.0, 16.0, 19.0, 7.0, 11.0, 12.0, 5.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.875, -34.895751953125, -33.91650390625, -32.937255859375, -31.9580078125, -30.978759765625, -29.99951171875, -29.020263671875, -28.041015625, -27.061767578125, -26.08251953125, -25.103271484375, -24.1240234375, -23.144775390625, -22.16552734375, -21.186279296875, -20.20703125, -19.227783203125, -18.24853515625, -17.269287109375, -16.2900390625, -15.310791015625, -14.33154296875, -13.352294921875, -12.373046875, -11.393798828125, -10.41455078125, -9.435302734375, -8.4560546875, -7.476806640625, -6.49755859375, -5.518310546875, -4.5390625, -3.559814453125, -2.58056640625, -1.601318359375, -0.6220703125, 0.357177734375, 1.33642578125, 2.315673828125, 3.294921875, 4.274169921875, 5.25341796875, 6.232666015625, 7.2119140625, 8.191162109375, 9.17041015625, 10.149658203125, 11.12890625, 12.108154296875, 13.08740234375, 14.066650390625, 15.0458984375, 16.025146484375, 17.00439453125, 17.983642578125, 18.962890625, 19.942138671875, 20.92138671875, 21.900634765625, 22.8798828125, 23.859130859375, 24.83837890625, 25.817626953125, 26.796875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 42.0, 330.0, 538.0, 97.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.038566589355469, -11.344952583312988, -8.651338577270508, -5.957724571228027, -3.264110565185547, -0.5704965591430664, 2.123117446899414, 4.816730499267578, 7.510345458984375, 10.203959465026855, 12.897573471069336, 15.591187477111816, 18.284801483154297, 20.978416442871094, 23.672029495239258, 26.365642547607422, 29.05925750732422, 31.752872467041016, 34.44648742675781, 37.140098571777344, 39.83371353149414, 42.52732849121094, 45.22093963623047, 47.914554595947266, 50.60816955566406, 53.30178451538086, 55.995399475097656, 58.68901062011719, 61.382625579833984, 64.07624053955078, 66.76985168457031, 69.46347045898438, 72.15708923339844, 74.85070037841797, 77.54431915283203, 80.23793029785156, 82.93154907226562, 85.62516021728516, 88.31877136230469, 91.01239013671875, 93.70600128173828, 96.39961242675781, 99.09323120117188, 101.7868423461914, 104.48045349121094, 107.174072265625, 109.86768341064453, 112.56129455566406, 115.25491333007812, 117.94852447509766, 120.64214324951172, 123.33575439453125, 126.02937316894531, 128.7229766845703, 131.41659545898438, 134.11021423339844, 136.8038330078125, 139.49745178222656, 142.19105529785156, 144.88467407226562, 147.5782928466797, 150.2718963623047, 152.96551513671875, 155.6591339111328, 158.3527374267578]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 16.0, 14.0, 16.0, 20.0, 24.0, 14.0, 35.0, 29.0, 26.0, 39.0, 45.0, 28.0, 31.0, 36.0, 29.0, 36.0, 36.0, 33.0, 28.0, 53.0, 36.0, 38.0, 25.0, 29.0, 18.0, 17.0, 24.0, 19.0, 15.0, 16.0, 12.0, 15.0, 13.0, 7.0, 14.0, 4.0, 13.0, 4.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-50.27008819580078, -48.72826385498047, -47.186439514160156, -45.64461898803711, -44.1027946472168, -42.560970306396484, -41.01914978027344, -39.477325439453125, -37.93550109863281, -36.3936767578125, -34.85185241699219, -33.31003189086914, -31.768207550048828, -30.226383209228516, -28.684560775756836, -27.142738342285156, -25.600914001464844, -24.05908966064453, -22.51726722717285, -20.975444793701172, -19.43362045288086, -17.891796112060547, -16.349973678588867, -14.808150291442871, -13.266326904296875, -11.724503517150879, -10.182680130004883, -8.640856742858887, -7.099033355712891, -5.5572099685668945, -4.015386581420898, -2.4735631942749023, -0.9317359924316406, 0.6100873947143555, 2.1519107818603516, 3.6937341690063477, 5.235557556152344, 6.77738094329834, 8.319204330444336, 9.861027717590332, 11.402851104736328, 12.944674491882324, 14.48649787902832, 16.0283203125, 17.570144653320312, 19.111968994140625, 20.653791427612305, 22.195613861083984, 23.737438201904297, 25.27926254272461, 26.82108497619629, 28.36290740966797, 29.90473175048828, 31.446556091308594, 32.988380432128906, 34.53020095825195, 36.072025299072266, 37.61384963989258, 39.155670166015625, 40.69749450683594, 42.23931884765625, 43.78114318847656, 45.322967529296875, 46.86478805541992, 48.406612396240234]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 7.0, 22.0, 15.0, 13.0, 25.0, 25.0, 26.0, 25.0, 32.0, 32.0, 32.0, 37.0, 51.0, 51.0, 34.0, 45.0, 47.0, 38.0, 35.0, 39.0, 42.0, 36.0, 33.0, 32.0, 29.0, 37.0, 26.0, 15.0, 17.0, 18.0, 10.0, 11.0, 6.0, 8.0, 8.0, 10.0, 0.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.350830078125, -5.19384765625, -5.036865234375, -4.8798828125, -4.722900390625, -4.56591796875, -4.408935546875, -4.251953125, -4.094970703125, -3.93798828125, -3.781005859375, -3.6240234375, -3.467041015625, -3.31005859375, -3.153076171875, -2.99609375, -2.839111328125, -2.68212890625, -2.525146484375, -2.3681640625, -2.211181640625, -2.05419921875, -1.897216796875, -1.740234375, -1.583251953125, -1.42626953125, -1.269287109375, -1.1123046875, -0.955322265625, -0.79833984375, -0.641357421875, -0.484375, -0.327392578125, -0.17041015625, -0.013427734375, 0.1435546875, 0.300537109375, 0.45751953125, 0.614501953125, 0.771484375, 0.928466796875, 1.08544921875, 1.242431640625, 1.3994140625, 1.556396484375, 1.71337890625, 1.870361328125, 2.02734375, 2.184326171875, 2.34130859375, 2.498291015625, 2.6552734375, 2.812255859375, 2.96923828125, 3.126220703125, 3.283203125, 3.440185546875, 3.59716796875, 3.754150390625, 3.9111328125, 4.068115234375, 4.22509765625, 4.382080078125, 4.5390625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 5.0, 15.0, 17.0, 21.0, 15.0, 17.0, 31.0, 33.0, 42.0, 104.0, 161.0, 360.0, 851.0, 3031.0, 14341.0, 103183.0, 1710362.0, 2196482.0, 142218.0, 17737.0, 3441.0, 952.0, 354.0, 167.0, 91.0, 49.0, 42.0, 21.0, 23.0, 17.0, 18.0, 14.0, 10.0, 7.0, 7.0, 8.0, 7.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.8336181640625, -15.354736328125, -14.8758544921875, -14.39697265625, -13.9180908203125, -13.439208984375, -12.9603271484375, -12.4814453125, -12.0025634765625, -11.523681640625, -11.0447998046875, -10.56591796875, -10.0870361328125, -9.608154296875, -9.1292724609375, -8.650390625, -8.1715087890625, -7.692626953125, -7.2137451171875, -6.73486328125, -6.2559814453125, -5.777099609375, -5.2982177734375, -4.8193359375, -4.3404541015625, -3.861572265625, -3.3826904296875, -2.90380859375, -2.4249267578125, -1.946044921875, -1.4671630859375, -0.98828125, -0.5093994140625, -0.030517578125, 0.4483642578125, 0.92724609375, 1.4061279296875, 1.885009765625, 2.3638916015625, 2.8427734375, 3.3216552734375, 3.800537109375, 4.2794189453125, 4.75830078125, 5.2371826171875, 5.716064453125, 6.1949462890625, 6.673828125, 7.1527099609375, 7.631591796875, 8.1104736328125, 8.58935546875, 9.0682373046875, 9.547119140625, 10.0260009765625, 10.5048828125, 10.9837646484375, 11.462646484375, 11.9415283203125, 12.42041015625, 12.8992919921875, 13.378173828125, 13.8570556640625, 14.3359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 11.0, 16.0, 20.0, 28.0, 53.0, 79.0, 88.0, 156.0, 193.0, 326.0, 461.0, 586.0, 553.0, 468.0, 319.0, 262.0, 139.0, 101.0, 72.0, 47.0, 29.0, 19.0, 15.0, 14.0, 4.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-20.328125, -19.8197021484375, -19.311279296875, -18.8028564453125, -18.29443359375, -17.7860107421875, -17.277587890625, -16.7691650390625, -16.2607421875, -15.7523193359375, -15.243896484375, -14.7354736328125, -14.22705078125, -13.7186279296875, -13.210205078125, -12.7017822265625, -12.193359375, -11.6849365234375, -11.176513671875, -10.6680908203125, -10.15966796875, -9.6512451171875, -9.142822265625, -8.6343994140625, -8.1259765625, -7.6175537109375, -7.109130859375, -6.6007080078125, -6.09228515625, -5.5838623046875, -5.075439453125, -4.5670166015625, -4.05859375, -3.5501708984375, -3.041748046875, -2.5333251953125, -2.02490234375, -1.5164794921875, -1.008056640625, -0.4996337890625, 0.0087890625, 0.5172119140625, 1.025634765625, 1.5340576171875, 2.04248046875, 2.5509033203125, 3.059326171875, 3.5677490234375, 4.076171875, 4.5845947265625, 5.093017578125, 5.6014404296875, 6.10986328125, 6.6182861328125, 7.126708984375, 7.6351318359375, 8.1435546875, 8.6519775390625, 9.160400390625, 9.6688232421875, 10.17724609375, 10.6856689453125, 11.194091796875, 11.7025146484375, 12.2109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 17.0, 19.0, 25.0, 29.0, 43.0, 62.0, 97.0, 126.0, 197.0, 388.0, 877.0, 3427.0, 33745.0, 1341233.0, 2747850.0, 59150.0, 4779.0, 1047.0, 451.0, 211.0, 152.0, 79.0, 71.0, 52.0, 38.0, 23.0, 18.0, 16.0, 5.0, 8.0, 13.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.404296875, -28.27734375, -27.150390625, -26.0234375, -24.896484375, -23.76953125, -22.642578125, -21.515625, -20.388671875, -19.26171875, -18.134765625, -17.0078125, -15.880859375, -14.75390625, -13.626953125, -12.5, -11.373046875, -10.24609375, -9.119140625, -7.9921875, -6.865234375, -5.73828125, -4.611328125, -3.484375, -2.357421875, -1.23046875, -0.103515625, 1.0234375, 2.150390625, 3.27734375, 4.404296875, 5.53125, 6.658203125, 7.78515625, 8.912109375, 10.0390625, 11.166015625, 12.29296875, 13.419921875, 14.546875, 15.673828125, 16.80078125, 17.927734375, 19.0546875, 20.181640625, 21.30859375, 22.435546875, 23.5625, 24.689453125, 25.81640625, 26.943359375, 28.0703125, 29.197265625, 30.32421875, 31.451171875, 32.578125, 33.705078125, 34.83203125, 35.958984375, 37.0859375, 38.212890625, 39.33984375, 40.466796875, 41.59375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 30.0, 142.0, 363.0, 322.0, 132.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.1250305175781, -283.5070495605469, -276.8890686035156, -270.2710876464844, -263.6531066894531, -257.03515625, -250.4171600341797, -243.79917907714844, -237.18121337890625, -230.563232421875, -223.94525146484375, -217.3272705078125, -210.7093048095703, -204.09132385253906, -197.4733428955078, -190.85536193847656, -184.2373809814453, -177.61940002441406, -171.0014190673828, -164.38345336914062, -157.76547241210938, -151.14749145507812, -144.52951049804688, -137.91152954101562, -131.29354858398438, -124.67556762695312, -118.0575942993164, -111.43961334228516, -104.82164001464844, -98.20365905761719, -91.58567810058594, -84.96769714355469, -78.34971618652344, -71.73173522949219, -65.11376190185547, -58.49578094482422, -51.877803802490234, -45.25982666015625, -38.641845703125, -32.023868560791016, -25.40589141845703, -18.787914276123047, -12.16993522644043, -5.5519561767578125, 1.0660209655761719, 7.683998107910156, 14.301979064941406, 20.91995620727539, 27.537933349609375, 34.15591049194336, 40.773887634277344, 47.391868591308594, 54.00984573364258, 60.62782287597656, 67.24580383300781, 73.86378479003906, 80.48175811767578, 87.09973907470703, 93.71771240234375, 100.335693359375, 106.95367431640625, 113.57164764404297, 120.18962860107422, 126.80760192871094, 133.4255828857422]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 15.0, 8.0, 6.0, 13.0, 13.0, 22.0, 22.0, 26.0, 26.0, 23.0, 30.0, 32.0, 32.0, 38.0, 28.0, 34.0, 46.0, 47.0, 31.0, 46.0, 41.0, 43.0, 40.0, 30.0, 39.0, 37.0, 31.0, 33.0, 21.0, 20.0, 18.0, 16.0, 19.0, 15.0, 13.0, 6.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.915924072265625, -41.523773193359375, -40.131622314453125, -38.739471435546875, -37.347320556640625, -35.95517349243164, -34.56302261352539, -33.17087173461914, -31.77872085571289, -30.38656997680664, -28.99441909790039, -27.602270126342773, -26.210119247436523, -24.817968368530273, -23.425819396972656, -22.033668518066406, -20.641517639160156, -19.249366760253906, -17.857215881347656, -16.46506690979004, -15.072916030883789, -13.680765151977539, -12.288615226745605, -10.896465301513672, -9.504314422607422, -8.112163543701172, -6.720013618469238, -5.3278632164001465, -3.9357128143310547, -2.543562412261963, -1.151412010192871, 0.2407379150390625, 1.6328887939453125, 3.0250391960144043, 4.417189598083496, 5.809340000152588, 7.20149040222168, 8.59364128112793, 9.985791206359863, 11.377941131591797, 12.770092010498047, 14.162242889404297, 15.55439281463623, 16.946542739868164, 18.338693618774414, 19.730844497680664, 21.12299346923828, 22.51514434814453, 23.90729522705078, 25.29944610595703, 26.69159698486328, 28.0837459564209, 29.47589683532715, 30.8680477142334, 32.260196685791016, 33.652347564697266, 35.044498443603516, 36.436649322509766, 37.828800201416016, 39.220951080322266, 40.61309814453125, 42.0052490234375, 43.39739990234375, 44.78955078125, 46.18170166015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 38.0, 29.0, 27.0, 24.0, 27.0, 22.0, 12.0, 16.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 21.0, 31.0, 55.0, 77.0, 113.0, 190.0, 257.0, 354.0, 530.0, 762.0, 1239.0, 1750.0, 2666.0, 4017.0, 5923.0, 8961.0, 13594.0, 20748.0, 31690.0, 49608.0, 76277.0, 113127.0, 152441.0, 164121.0, 132015.0, 93086.0, 60885.0, 39174.0, 25624.0, 16589.0, 10822.0, 7201.0, 4867.0, 3185.0, 2163.0, 1411.0, 977.0, 668.0, 415.0, 291.0, 201.0, 126.0, 98.0, 64.0, 49.0, 30.0, 11.0, 12.0, 7.0, 13.0, 2.0, 4.0], "bins": [-0.51025390625, -0.4957733154296875, -0.481292724609375, -0.4668121337890625, -0.45233154296875, -0.4378509521484375, -0.423370361328125, -0.4088897705078125, -0.3944091796875, -0.3799285888671875, -0.365447998046875, -0.3509674072265625, -0.33648681640625, -0.3220062255859375, -0.307525634765625, -0.2930450439453125, -0.278564453125, -0.2640838623046875, -0.249603271484375, -0.2351226806640625, -0.22064208984375, -0.2061614990234375, -0.191680908203125, -0.1772003173828125, -0.1627197265625, -0.1482391357421875, -0.133758544921875, -0.1192779541015625, -0.10479736328125, -0.0903167724609375, -0.075836181640625, -0.0613555908203125, -0.046875, -0.0323944091796875, -0.017913818359375, -0.0034332275390625, 0.01104736328125, 0.0255279541015625, 0.040008544921875, 0.0544891357421875, 0.0689697265625, 0.0834503173828125, 0.097930908203125, 0.1124114990234375, 0.12689208984375, 0.1413726806640625, 0.155853271484375, 0.1703338623046875, 0.184814453125, 0.1992950439453125, 0.213775634765625, 0.2282562255859375, 0.24273681640625, 0.2572174072265625, 0.271697998046875, 0.2861785888671875, 0.3006591796875, 0.3151397705078125, 0.329620361328125, 0.3441009521484375, 0.35858154296875, 0.3730621337890625, 0.387542724609375, 0.4020233154296875, 0.41650390625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 17.0, 7.0, 11.0, 17.0, 22.0, 17.0, 29.0, 30.0, 29.0, 30.0, 34.0, 42.0, 50.0, 33.0, 47.0, 40.0, 1065.0, 33.0, 37.0, 34.0, 43.0, 37.0, 31.0, 37.0, 31.0, 26.0, 28.0, 18.0, 31.0, 11.0, 13.0, 19.0, 9.0, 7.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-3.93359375, -3.8292236328125, -3.724853515625, -3.6204833984375, -3.51611328125, -3.4117431640625, -3.307373046875, -3.2030029296875, -3.0986328125, -2.9942626953125, -2.889892578125, -2.7855224609375, -2.68115234375, -2.5767822265625, -2.472412109375, -2.3680419921875, -2.263671875, -2.1593017578125, -2.054931640625, -1.9505615234375, -1.84619140625, -1.7418212890625, -1.637451171875, -1.5330810546875, -1.4287109375, -1.3243408203125, -1.219970703125, -1.1156005859375, -1.01123046875, -0.9068603515625, -0.802490234375, -0.6981201171875, -0.59375, -0.4893798828125, -0.385009765625, -0.2806396484375, -0.17626953125, -0.0718994140625, 0.032470703125, 0.1368408203125, 0.2412109375, 0.3455810546875, 0.449951171875, 0.5543212890625, 0.65869140625, 0.7630615234375, 0.867431640625, 0.9718017578125, 1.076171875, 1.1805419921875, 1.284912109375, 1.3892822265625, 1.49365234375, 1.5980224609375, 1.702392578125, 1.8067626953125, 1.9111328125, 2.0155029296875, 2.119873046875, 2.2242431640625, 2.32861328125, 2.4329833984375, 2.537353515625, 2.6417236328125, 2.74609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 12.0, 10.0, 31.0, 34.0, 83.0, 106.0, 166.0, 276.0, 434.0, 701.0, 1065.0, 1837.0, 2882.0, 4471.0, 7062.0, 10878.0, 16859.0, 25970.0, 40017.0, 61382.0, 92321.0, 130035.0, 1200742.0, 154481.0, 116473.0, 79995.0, 52644.0, 34136.0, 22217.0, 14269.0, 9221.0, 5895.0, 3897.0, 2435.0, 1528.0, 995.0, 567.0, 357.0, 233.0, 138.0, 103.0, 55.0, 43.0, 26.0, 17.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3671875, -0.3559989929199219, -0.34481048583984375, -0.3336219787597656, -0.3224334716796875, -0.3112449645996094, -0.30005645751953125, -0.2888679504394531, -0.277679443359375, -0.2664909362792969, -0.25530242919921875, -0.24411392211914062, -0.2329254150390625, -0.22173690795898438, -0.21054840087890625, -0.19935989379882812, -0.18817138671875, -0.17698287963867188, -0.16579437255859375, -0.15460586547851562, -0.1434173583984375, -0.13222885131835938, -0.12104034423828125, -0.10985183715820312, -0.098663330078125, -0.08747482299804688, -0.07628631591796875, -0.06509780883789062, -0.0539093017578125, -0.042720794677734375, -0.03153228759765625, -0.020343780517578125, -0.0091552734375, 0.002033233642578125, 0.01322174072265625, 0.024410247802734375, 0.0355987548828125, 0.046787261962890625, 0.05797576904296875, 0.06916427612304688, 0.080352783203125, 0.09154129028320312, 0.10272979736328125, 0.11391830444335938, 0.1251068115234375, 0.13629531860351562, 0.14748382568359375, 0.15867233276367188, 0.16986083984375, 0.18104934692382812, 0.19223785400390625, 0.20342636108398438, 0.2146148681640625, 0.22580337524414062, 0.23699188232421875, 0.24818038940429688, 0.259368896484375, 0.2705574035644531, 0.28174591064453125, 0.2929344177246094, 0.3041229248046875, 0.3153114318847656, 0.32649993896484375, 0.3376884460449219, 0.348876953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 2.0, 5.0, 3.0, 7.0, 10.0, 14.0, 16.0, 20.0, 23.0, 21.0, 25.0, 37.0, 42.0, 50.0, 76.0, 82.0, 78.0, 73.0, 68.0, 53.0, 43.0, 50.0, 32.0, 29.0, 32.0, 14.0, 19.0, 10.0, 9.0, 11.0, 8.0, 6.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029582977294921875, -0.0028679370880126953, -0.002777576446533203, -0.002687215805053711, -0.0025968551635742188, -0.0025064945220947266, -0.0024161338806152344, -0.002325773239135742, -0.00223541259765625, -0.002145051956176758, -0.0020546913146972656, -0.0019643306732177734, -0.0018739700317382812, -0.001783609390258789, -0.0016932487487792969, -0.0016028881072998047, -0.0015125274658203125, -0.0014221668243408203, -0.0013318061828613281, -0.001241445541381836, -0.0011510848999023438, -0.0010607242584228516, -0.0009703636169433594, -0.0008800029754638672, -0.000789642333984375, -0.0006992816925048828, -0.0006089210510253906, -0.0005185604095458984, -0.00042819976806640625, -0.00033783912658691406, -0.0002474784851074219, -0.0001571178436279297, -6.67572021484375e-05, 2.3603439331054688e-05, 0.00011396408081054688, 0.00020432472229003906, 0.00029468536376953125, 0.00038504600524902344, 0.0004754066467285156, 0.0005657672882080078, 0.0006561279296875, 0.0007464885711669922, 0.0008368492126464844, 0.0009272098541259766, 0.0010175704956054688, 0.001107931137084961, 0.0011982917785644531, 0.0012886524200439453, 0.0013790130615234375, 0.0014693737030029297, 0.0015597343444824219, 0.001650094985961914, 0.0017404556274414062, 0.0018308162689208984, 0.0019211769104003906, 0.002011537551879883, 0.002101898193359375, 0.002192258834838867, 0.0022826194763183594, 0.0023729801177978516, 0.0024633407592773438, 0.002553701400756836, 0.002644062042236328, 0.0027344226837158203, 0.0028247833251953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 7.0, 12.0, 11.0, 6.0, 19.0, 31.0, 41.0, 49.0, 62.0, 107.0, 167.0, 263.0, 470.0, 1367.0, 215607.0, 826420.0, 2439.0, 550.0, 293.0, 187.0, 133.0, 74.0, 48.0, 43.0, 26.0, 24.0, 16.0, 15.0, 8.0, 5.0, 10.0, 6.0, 6.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05712890625, -0.055350303649902344, -0.05357170104980469, -0.05179309844970703, -0.050014495849609375, -0.04823589324951172, -0.04645729064941406, -0.044678688049316406, -0.04290008544921875, -0.041121482849121094, -0.03934288024902344, -0.03756427764892578, -0.035785675048828125, -0.03400707244873047, -0.03222846984863281, -0.030449867248535156, -0.0286712646484375, -0.026892662048339844, -0.025114059448242188, -0.02333545684814453, -0.021556854248046875, -0.01977825164794922, -0.017999649047851562, -0.016221046447753906, -0.01444244384765625, -0.012663841247558594, -0.010885238647460938, -0.009106636047363281, -0.007328033447265625, -0.005549430847167969, -0.0037708282470703125, -0.0019922256469726562, -0.000213623046875, 0.0015649795532226562, 0.0033435821533203125, 0.005122184753417969, 0.006900787353515625, 0.008679389953613281, 0.010457992553710938, 0.012236595153808594, 0.01401519775390625, 0.015793800354003906, 0.017572402954101562, 0.01935100555419922, 0.021129608154296875, 0.02290821075439453, 0.024686813354492188, 0.026465415954589844, 0.0282440185546875, 0.030022621154785156, 0.03180122375488281, 0.03357982635498047, 0.035358428955078125, 0.03713703155517578, 0.03891563415527344, 0.040694236755371094, 0.04247283935546875, 0.044251441955566406, 0.04603004455566406, 0.04780864715576172, 0.049587249755859375, 0.05136585235595703, 0.05314445495605469, 0.054923057556152344, 0.05670166015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 167.0, 644.0, 180.0, 14.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006655517499893904, -0.006295669823884964, -0.005935822147876024, -0.0055759744718670845, -0.005216127261519432, -0.004856279119849205, -0.004496431909501553, -0.004136584233492613, -0.003776736557483673, -0.0034168888814747334, -0.0030570412054657936, -0.0026971937622874975, -0.0023373460862785578, -0.001977498410269618, -0.001617650967091322, -0.0012578032910823822, -0.0008979556150734425, -0.0005381079972721636, -0.0001782603794708848, 0.00018158718012273312, 0.0005414348561316729, 0.0009012825321406126, 0.0012611299753189087, 0.0016209776513278484, 0.001980825327336788, 0.002340673003345728, 0.0027005206793546677, 0.0030603681225329638, 0.0034202157985419035, 0.0037800634745508432, 0.004139910917729139, 0.004499758593738079, 0.0048596058040857315, 0.005219453480094671, 0.005579301156103611, 0.005939148366451263, 0.0062989965081214905, 0.006658843718469143, 0.007018691394478083, 0.007378539070487022, 0.007738386746495962, 0.008098234422504902, 0.008458081632852554, 0.008817929774522781, 0.009177776984870434, 0.00953762512654066, 0.009897472336888313, 0.01025732047855854, 0.010617167688906193, 0.010977014899253845, 0.011336863040924072, 0.011696710251271725, 0.012056558392941952, 0.012416405603289604, 0.012776253744959831, 0.013136100955307484, 0.013495948165655136, 0.013855795376002789, 0.014215643517673016, 0.014575490728020668, 0.014935338869690895, 0.015295186080038548, 0.0156550332903862, 0.016014881432056427, 0.016374729573726654]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 14.0, 16.0, 17.0, 30.0, 44.0, 39.0, 34.0, 60.0, 53.0, 32.0, 53.0, 47.0, 48.0, 52.0, 53.0, 45.0, 44.0, 31.0, 38.0, 33.0, 31.0, 27.0, 17.0, 17.0, 22.0, 8.0, 14.0, 11.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020488500595092773, -0.0019908715039491653, -0.0019328929483890533, -0.0018749143928289413, -0.0018169358372688293, -0.0017589572817087173, -0.0017009787261486053, -0.0016430001705884933, -0.0015850216150283813, -0.0015270430594682693, -0.0014690645039081573, -0.0014110859483480453, -0.0013531073927879333, -0.0012951288372278214, -0.0012371502816677094, -0.0011791717261075974, -0.0011211931705474854, -0.0010632146149873734, -0.0010052360594272614, -0.0009472575038671494, -0.0008892789483070374, -0.0008313003927469254, -0.0007733218371868134, -0.0007153432816267014, -0.0006573647260665894, -0.0005993861705064774, -0.0005414076149463654, -0.00048342905938625336, -0.00042545050382614136, -0.00036747194826602936, -0.00030949339270591736, -0.00025151483714580536, -0.00019353628158569336, -0.00013555772602558136, -7.757917046546936e-05, -1.960061490535736e-05, 3.837794065475464e-05, 9.635649621486664e-05, 0.00015433505177497864, 0.00021231360733509064, 0.00027029216289520264, 0.00032827071845531464, 0.00038624927401542664, 0.00044422782957553864, 0.0005022063851356506, 0.0005601849406957626, 0.0006181634962558746, 0.0006761420518159866, 0.0007341206073760986, 0.0007920991629362106, 0.0008500777184963226, 0.0009080562740564346, 0.0009660348296165466, 0.0010240133851766586, 0.0010819919407367706, 0.0011399704962968826, 0.0011979490518569946, 0.0012559276074171066, 0.0013139061629772186, 0.0013718847185373306, 0.0014298632740974426, 0.0014878418296575546, 0.0015458203852176666, 0.0016037989407777786, 0.0016617774963378906]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 37.0, 30.0, 27.0, 24.0, 27.0, 22.0, 13.0, 15.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 18.0, 35.0, 50.0, 72.0, 117.0, 164.0, 243.0, 340.0, 527.0, 783.0, 1165.0, 1789.0, 2696.0, 4143.0, 6642.0, 12243.0, 26342.0, 74168.0, 315040.0, 438492.0, 96693.0, 31905.0, 14274.0, 7476.0, 4440.0, 2865.0, 1891.0, 1257.0, 781.0, 585.0, 404.0, 290.0, 180.0, 130.0, 73.0, 59.0, 41.0, 34.0, 28.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.2032470703125, -4.058837890625, -3.9144287109375, -3.77001953125, -3.6256103515625, -3.481201171875, -3.3367919921875, -3.1923828125, -3.0479736328125, -2.903564453125, -2.7591552734375, -2.61474609375, -2.4703369140625, -2.325927734375, -2.1815185546875, -2.037109375, -1.8927001953125, -1.748291015625, -1.6038818359375, -1.45947265625, -1.3150634765625, -1.170654296875, -1.0262451171875, -0.8818359375, -0.7374267578125, -0.593017578125, -0.4486083984375, -0.30419921875, -0.1597900390625, -0.015380859375, 0.1290283203125, 0.2734375, 0.4178466796875, 0.562255859375, 0.7066650390625, 0.85107421875, 0.9954833984375, 1.139892578125, 1.2843017578125, 1.4287109375, 1.5731201171875, 1.717529296875, 1.8619384765625, 2.00634765625, 2.1507568359375, 2.295166015625, 2.4395751953125, 2.583984375, 2.7283935546875, 2.872802734375, 3.0172119140625, 3.16162109375, 3.3060302734375, 3.450439453125, 3.5948486328125, 3.7392578125, 3.8836669921875, 4.028076171875, 4.1724853515625, 4.31689453125, 4.4613037109375, 4.605712890625, 4.7501220703125, 4.89453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 11.0, 5.0, 10.0, 16.0, 24.0, 23.0, 25.0, 24.0, 40.0, 30.0, 35.0, 36.0, 37.0, 52.0, 85.0, 176.0, 1699.0, 210.0, 79.0, 53.0, 41.0, 40.0, 34.0, 30.0, 24.0, 36.0, 26.0, 25.0, 15.0, 23.0, 12.0, 15.0, 6.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-21.859375, -21.27783203125, -20.6962890625, -20.11474609375, -19.533203125, -18.95166015625, -18.3701171875, -17.78857421875, -17.20703125, -16.62548828125, -16.0439453125, -15.46240234375, -14.880859375, -14.29931640625, -13.7177734375, -13.13623046875, -12.5546875, -11.97314453125, -11.3916015625, -10.81005859375, -10.228515625, -9.64697265625, -9.0654296875, -8.48388671875, -7.90234375, -7.32080078125, -6.7392578125, -6.15771484375, -5.576171875, -4.99462890625, -4.4130859375, -3.83154296875, -3.25, -2.66845703125, -2.0869140625, -1.50537109375, -0.923828125, -0.34228515625, 0.2392578125, 0.82080078125, 1.40234375, 1.98388671875, 2.5654296875, 3.14697265625, 3.728515625, 4.31005859375, 4.8916015625, 5.47314453125, 6.0546875, 6.63623046875, 7.2177734375, 7.79931640625, 8.380859375, 8.96240234375, 9.5439453125, 10.12548828125, 10.70703125, 11.28857421875, 11.8701171875, 12.45166015625, 13.033203125, 13.61474609375, 14.1962890625, 14.77783203125, 15.359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 12.0, 13.0, 13.0, 24.0, 28.0, 39.0, 57.0, 97.0, 113.0, 204.0, 374.0, 1153.0, 18679.0, 3091759.0, 30707.0, 1394.0, 366.0, 218.0, 122.0, 94.0, 63.0, 43.0, 36.0, 22.0, 12.0, 16.0, 8.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.28125, -40.8505859375, -39.419921875, -37.9892578125, -36.55859375, -35.1279296875, -33.697265625, -32.2666015625, -30.8359375, -29.4052734375, -27.974609375, -26.5439453125, -25.11328125, -23.6826171875, -22.251953125, -20.8212890625, -19.390625, -17.9599609375, -16.529296875, -15.0986328125, -13.66796875, -12.2373046875, -10.806640625, -9.3759765625, -7.9453125, -6.5146484375, -5.083984375, -3.6533203125, -2.22265625, -0.7919921875, 0.638671875, 2.0693359375, 3.5, 4.9306640625, 6.361328125, 7.7919921875, 9.22265625, 10.6533203125, 12.083984375, 13.5146484375, 14.9453125, 16.3759765625, 17.806640625, 19.2373046875, 20.66796875, 22.0986328125, 23.529296875, 24.9599609375, 26.390625, 27.8212890625, 29.251953125, 30.6826171875, 32.11328125, 33.5439453125, 34.974609375, 36.4052734375, 37.8359375, 39.2666015625, 40.697265625, 42.1279296875, 43.55859375, 44.9892578125, 46.419921875, 47.8505859375, 49.28125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 59.0, 307.0, 457.0, 161.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.2296371459961, -80.72634887695312, -78.22306823730469, -75.71977996826172, -73.21649932861328, -70.71321105957031, -68.20993041992188, -65.7066421508789, -63.2033576965332, -60.7000732421875, -58.1967887878418, -55.693504333496094, -53.190216064453125, -50.68693542480469, -48.18364715576172, -45.680362701416016, -43.17707824707031, -40.67379379272461, -38.170509338378906, -35.6672248840332, -33.1639404296875, -30.660654067993164, -28.157367706298828, -25.654083251953125, -23.150798797607422, -20.64751434326172, -18.144229888916016, -15.64094352722168, -13.137659072875977, -10.634374618530273, -8.131089210510254, -5.627803802490234, -3.1245193481445312, -0.6212344169616699, 1.8820505142211914, 4.385335445404053, 6.888620376586914, 9.391904830932617, 11.895190238952637, 14.398475646972656, 16.90176010131836, 19.405044555664062, 21.908329010009766, 24.4116153717041, 26.914899826049805, 29.418184280395508, 31.921470642089844, 34.42475509643555, 36.92803955078125, 39.43132400512695, 41.934608459472656, 44.43789291381836, 46.94117736816406, 49.44446563720703, 51.947750091552734, 54.45103454589844, 56.95431900024414, 59.457603454589844, 61.96088790893555, 64.46417236328125, 66.96746063232422, 69.47074127197266, 71.97402954101562, 74.47731018066406, 76.98059844970703]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 8.0, 10.0, 6.0, 17.0, 16.0, 20.0, 24.0, 16.0, 27.0, 23.0, 34.0, 32.0, 39.0, 44.0, 32.0, 38.0, 31.0, 31.0, 43.0, 52.0, 44.0, 32.0, 29.0, 41.0, 31.0, 42.0, 33.0, 28.0, 19.0, 17.0, 26.0, 24.0, 12.0, 9.0, 13.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.48713302612305, -49.892730712890625, -48.29833221435547, -46.70392990112305, -45.10953140258789, -43.51512908935547, -41.92073059082031, -40.32632827758789, -38.73192596435547, -37.13752365112305, -35.54312515258789, -33.94872283935547, -32.35432434082031, -30.75992202758789, -29.1655216217041, -27.571121215820312, -25.976722717285156, -24.382322311401367, -22.787921905517578, -21.193519592285156, -19.59912109375, -18.004718780517578, -16.41031837463379, -14.81591796875, -13.221517562866211, -11.627117156982422, -10.032716751098633, -8.438315391540527, -6.843914985656738, -5.249514579772949, -3.6551132202148438, -2.0607128143310547, -0.46631622314453125, 1.128084421157837, 2.722485065460205, 4.316885948181152, 5.911286354064941, 7.5056867599487305, 9.100088119506836, 10.694488525390625, 12.288888931274414, 13.883289337158203, 15.477689743041992, 17.07209014892578, 18.666492462158203, 20.26089096069336, 21.85529327392578, 23.44969367980957, 25.04409408569336, 26.63849449157715, 28.232894897460938, 29.82729721069336, 31.421695709228516, 33.01609802246094, 34.610496520996094, 36.204898834228516, 37.79930114746094, 39.39370346069336, 40.988101959228516, 42.58250427246094, 44.176902770996094, 45.771305084228516, 47.36570739746094, 48.960105895996094, 50.55450439453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 1.0, 8.0, 1.0, 5.0, 8.0, 7.0, 11.0, 15.0, 17.0, 18.0, 24.0, 20.0, 22.0, 19.0, 27.0, 27.0, 38.0, 41.0, 34.0, 35.0, 42.0, 47.0, 42.0, 30.0, 38.0, 35.0, 36.0, 38.0, 41.0, 26.0, 29.0, 31.0, 23.0, 29.0, 18.0, 20.0, 17.0, 13.0, 13.0, 13.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.3515625, -5.19842529296875, -5.0452880859375, -4.89215087890625, -4.739013671875, -4.58587646484375, -4.4327392578125, -4.27960205078125, -4.12646484375, -3.97332763671875, -3.8201904296875, -3.66705322265625, -3.513916015625, -3.36077880859375, -3.2076416015625, -3.05450439453125, -2.9013671875, -2.74822998046875, -2.5950927734375, -2.44195556640625, -2.288818359375, -2.13568115234375, -1.9825439453125, -1.82940673828125, -1.67626953125, -1.52313232421875, -1.3699951171875, -1.21685791015625, -1.063720703125, -0.91058349609375, -0.7574462890625, -0.60430908203125, -0.451171875, -0.29803466796875, -0.1448974609375, 0.00823974609375, 0.161376953125, 0.31451416015625, 0.4676513671875, 0.62078857421875, 0.77392578125, 0.92706298828125, 1.0802001953125, 1.23333740234375, 1.386474609375, 1.53961181640625, 1.6927490234375, 1.84588623046875, 1.9990234375, 2.15216064453125, 2.3052978515625, 2.45843505859375, 2.611572265625, 2.76470947265625, 2.9178466796875, 3.07098388671875, 3.22412109375, 3.37725830078125, 3.5303955078125, 3.68353271484375, 3.836669921875, 3.98980712890625, 4.1429443359375, 4.29608154296875, 4.44921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 12.0, 17.0, 22.0, 30.0, 24.0, 43.0, 75.0, 98.0, 162.0, 214.0, 379.0, 527.0, 935.0, 1569.0, 2748.0, 5162.0, 10019.0, 21319.0, 50931.0, 151626.0, 528431.0, 1302299.0, 1321608.0, 542995.0, 157475.0, 52142.0, 21543.0, 10013.0, 5059.0, 2756.0, 1562.0, 946.0, 528.0, 336.0, 214.0, 145.0, 83.0, 56.0, 53.0, 22.0, 29.0, 24.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.25, -6.0606689453125, -5.871337890625, -5.6820068359375, -5.49267578125, -5.3033447265625, -5.114013671875, -4.9246826171875, -4.7353515625, -4.5460205078125, -4.356689453125, -4.1673583984375, -3.97802734375, -3.7886962890625, -3.599365234375, -3.4100341796875, -3.220703125, -3.0313720703125, -2.842041015625, -2.6527099609375, -2.46337890625, -2.2740478515625, -2.084716796875, -1.8953857421875, -1.7060546875, -1.5167236328125, -1.327392578125, -1.1380615234375, -0.94873046875, -0.7593994140625, -0.570068359375, -0.3807373046875, -0.19140625, -0.0020751953125, 0.187255859375, 0.3765869140625, 0.56591796875, 0.7552490234375, 0.944580078125, 1.1339111328125, 1.3232421875, 1.5125732421875, 1.701904296875, 1.8912353515625, 2.08056640625, 2.2698974609375, 2.459228515625, 2.6485595703125, 2.837890625, 3.0272216796875, 3.216552734375, 3.4058837890625, 3.59521484375, 3.7845458984375, 3.973876953125, 4.1632080078125, 4.3525390625, 4.5418701171875, 4.731201171875, 4.9205322265625, 5.10986328125, 5.2991943359375, 5.488525390625, 5.6778564453125, 5.8671875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 18.0, 29.0, 37.0, 54.0, 63.0, 105.0, 119.0, 181.0, 228.0, 274.0, 450.0, 502.0, 471.0, 423.0, 291.0, 214.0, 171.0, 134.0, 87.0, 56.0, 41.0, 32.0, 26.0, 13.0, 11.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.2310791015625, -10.798095703125, -10.3651123046875, -9.93212890625, -9.4991455078125, -9.066162109375, -8.6331787109375, -8.2001953125, -7.7672119140625, -7.334228515625, -6.9012451171875, -6.46826171875, -6.0352783203125, -5.602294921875, -5.1693115234375, -4.736328125, -4.3033447265625, -3.870361328125, -3.4373779296875, -3.00439453125, -2.5714111328125, -2.138427734375, -1.7054443359375, -1.2724609375, -0.8394775390625, -0.406494140625, 0.0264892578125, 0.45947265625, 0.8924560546875, 1.325439453125, 1.7584228515625, 2.19140625, 2.6243896484375, 3.057373046875, 3.4903564453125, 3.92333984375, 4.3563232421875, 4.789306640625, 5.2222900390625, 5.6552734375, 6.0882568359375, 6.521240234375, 6.9542236328125, 7.38720703125, 7.8201904296875, 8.253173828125, 8.6861572265625, 9.119140625, 9.5521240234375, 9.985107421875, 10.4180908203125, 10.85107421875, 11.2840576171875, 11.717041015625, 12.1500244140625, 12.5830078125, 13.0159912109375, 13.448974609375, 13.8819580078125, 14.31494140625, 14.7479248046875, 15.180908203125, 15.6138916015625, 16.046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 12.0, 18.0, 24.0, 49.0, 46.0, 70.0, 96.0, 145.0, 244.0, 405.0, 1084.0, 5460.0, 107353.0, 3670372.0, 393710.0, 12117.0, 1648.0, 558.0, 283.0, 177.0, 112.0, 82.0, 62.0, 39.0, 28.0, 22.0, 15.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.5625, -26.34619140625, -25.1298828125, -23.91357421875, -22.697265625, -21.48095703125, -20.2646484375, -19.04833984375, -17.83203125, -16.61572265625, -15.3994140625, -14.18310546875, -12.966796875, -11.75048828125, -10.5341796875, -9.31787109375, -8.1015625, -6.88525390625, -5.6689453125, -4.45263671875, -3.236328125, -2.02001953125, -0.8037109375, 0.41259765625, 1.62890625, 2.84521484375, 4.0615234375, 5.27783203125, 6.494140625, 7.71044921875, 8.9267578125, 10.14306640625, 11.359375, 12.57568359375, 13.7919921875, 15.00830078125, 16.224609375, 17.44091796875, 18.6572265625, 19.87353515625, 21.08984375, 22.30615234375, 23.5224609375, 24.73876953125, 25.955078125, 27.17138671875, 28.3876953125, 29.60400390625, 30.8203125, 32.03662109375, 33.2529296875, 34.46923828125, 35.685546875, 36.90185546875, 38.1181640625, 39.33447265625, 40.55078125, 41.76708984375, 42.9833984375, 44.19970703125, 45.416015625, 46.63232421875, 47.8486328125, 49.06494140625, 50.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 20.0, 27.0, 45.0, 72.0, 108.0, 152.0, 153.0, 152.0, 113.0, 61.0, 44.0, 30.0, 19.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.60558319091797, -121.05137634277344, -118.49716186523438, -115.94295501708984, -113.38874816894531, -110.83454132080078, -108.28033447265625, -105.72611999511719, -103.17191314697266, -100.61770629882812, -98.06349182128906, -95.50928497314453, -92.955078125, -90.40087127685547, -87.84666442871094, -85.29244995117188, -82.73824310302734, -80.18403625488281, -77.62982177734375, -75.07561492919922, -72.52140808105469, -69.96720123291016, -67.41299438476562, -64.85877990722656, -62.30457305908203, -59.7503662109375, -57.1961555480957, -54.641944885253906, -52.087738037109375, -49.533531188964844, -46.97932052612305, -44.42510986328125, -41.87089538574219, -39.316688537597656, -36.76247787475586, -34.20826721191406, -31.65406036376953, -29.099851608276367, -26.545642852783203, -23.99143409729004, -21.437225341796875, -18.88301658630371, -16.328807830810547, -13.774599075317383, -11.220390319824219, -8.666181564331055, -6.111972808837891, -3.5577640533447266, -1.0035552978515625, 1.5506534576416016, 4.104862213134766, 6.65907096862793, 9.213279724121094, 11.767488479614258, 14.321697235107422, 16.875905990600586, 19.43011474609375, 21.984323501586914, 24.538532257080078, 27.092741012573242, 29.646949768066406, 32.20115661621094, 34.755367279052734, 37.30957794189453, 39.86378479003906]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 6.0, 2.0, 9.0, 8.0, 10.0, 6.0, 16.0, 14.0, 14.0, 23.0, 26.0, 14.0, 21.0, 24.0, 24.0, 29.0, 23.0, 35.0, 41.0, 36.0, 29.0, 46.0, 43.0, 36.0, 44.0, 37.0, 38.0, 41.0, 30.0, 34.0, 34.0, 20.0, 16.0, 21.0, 23.0, 15.0, 13.0, 16.0, 11.0, 7.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.10260009765625, -36.93830108642578, -35.77400207519531, -34.60970687866211, -33.44540786743164, -32.28110885620117, -31.116811752319336, -29.9525146484375, -28.78821563720703, -27.623916625976562, -26.459619522094727, -25.29532241821289, -24.131023406982422, -22.966724395751953, -21.802427291870117, -20.63813018798828, -19.473831176757812, -18.309532165527344, -17.145235061645508, -15.980937004089355, -14.816638946533203, -13.65234088897705, -12.488042831420898, -11.323744773864746, -10.159446716308594, -8.995148658752441, -7.830850601196289, -6.666552543640137, -5.502254486083984, -4.337956428527832, -3.1736583709716797, -2.0093603134155273, -0.845062255859375, 0.31923580169677734, 1.4835338592529297, 2.647831916809082, 3.8121299743652344, 4.976428031921387, 6.140726089477539, 7.305024147033691, 8.469322204589844, 9.633620262145996, 10.797918319702148, 11.9622163772583, 13.126514434814453, 14.290812492370605, 15.455110549926758, 16.619407653808594, 17.783706665039062, 18.94800567626953, 20.112302780151367, 21.276599884033203, 22.440898895263672, 23.60519790649414, 24.769495010375977, 25.933792114257812, 27.09809112548828, 28.26239013671875, 29.426687240600586, 30.590984344482422, 31.75528335571289, 32.91958236694336, 34.08387756347656, 35.24817657470703, 36.4124755859375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 42.0, 40.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 13.0, 16.0, 27.0, 39.0, 75.0, 85.0, 144.0, 220.0, 343.0, 562.0, 782.0, 1267.0, 1957.0, 2976.0, 4636.0, 7105.0, 11002.0, 17378.0, 27069.0, 42489.0, 66520.0, 102655.0, 150531.0, 180080.0, 148493.0, 100888.0, 65226.0, 41673.0, 26689.0, 16766.0, 10982.0, 7044.0, 4481.0, 2994.0, 1812.0, 1261.0, 778.0, 521.0, 333.0, 221.0, 145.0, 92.0, 70.0, 39.0, 28.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.54736328125, -0.5305099487304688, -0.5136566162109375, -0.49680328369140625, -0.479949951171875, -0.46309661865234375, -0.4462432861328125, -0.42938995361328125, -0.41253662109375, -0.39568328857421875, -0.3788299560546875, -0.36197662353515625, -0.345123291015625, -0.32826995849609375, -0.3114166259765625, -0.29456329345703125, -0.2777099609375, -0.26085662841796875, -0.2440032958984375, -0.22714996337890625, -0.210296630859375, -0.19344329833984375, -0.1765899658203125, -0.15973663330078125, -0.14288330078125, -0.12602996826171875, -0.1091766357421875, -0.09232330322265625, -0.075469970703125, -0.05861663818359375, -0.0417633056640625, -0.02490997314453125, -0.008056640625, 0.00879669189453125, 0.0256500244140625, 0.04250335693359375, 0.059356689453125, 0.07621002197265625, 0.0930633544921875, 0.10991668701171875, 0.12677001953125, 0.14362335205078125, 0.1604766845703125, 0.17733001708984375, 0.194183349609375, 0.21103668212890625, 0.2278900146484375, 0.24474334716796875, 0.2615966796875, 0.27845001220703125, 0.2953033447265625, 0.31215667724609375, 0.329010009765625, 0.34586334228515625, 0.3627166748046875, 0.37957000732421875, 0.39642333984375, 0.41327667236328125, 0.4301300048828125, 0.44698333740234375, 0.463836669921875, 0.48069000244140625, 0.4975433349609375, 0.5143966674804688, 0.53125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 11.0, 10.0, 10.0, 15.0, 14.0, 12.0, 19.0, 22.0, 19.0, 21.0, 25.0, 33.0, 26.0, 33.0, 48.0, 40.0, 42.0, 36.0, 1066.0, 49.0, 35.0, 54.0, 44.0, 41.0, 36.0, 23.0, 28.0, 35.0, 28.0, 19.0, 23.0, 18.0, 23.0, 9.0, 16.0, 8.0, 5.0, 6.0, 8.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-3.892578125, -3.78668212890625, -3.6807861328125, -3.57489013671875, -3.468994140625, -3.36309814453125, -3.2572021484375, -3.15130615234375, -3.04541015625, -2.93951416015625, -2.8336181640625, -2.72772216796875, -2.621826171875, -2.51593017578125, -2.4100341796875, -2.30413818359375, -2.1982421875, -2.09234619140625, -1.9864501953125, -1.88055419921875, -1.774658203125, -1.66876220703125, -1.5628662109375, -1.45697021484375, -1.35107421875, -1.24517822265625, -1.1392822265625, -1.03338623046875, -0.927490234375, -0.82159423828125, -0.7156982421875, -0.60980224609375, -0.50390625, -0.39801025390625, -0.2921142578125, -0.18621826171875, -0.080322265625, 0.02557373046875, 0.1314697265625, 0.23736572265625, 0.34326171875, 0.44915771484375, 0.5550537109375, 0.66094970703125, 0.766845703125, 0.87274169921875, 0.9786376953125, 1.08453369140625, 1.1904296875, 1.29632568359375, 1.4022216796875, 1.50811767578125, 1.614013671875, 1.71990966796875, 1.8258056640625, 1.93170166015625, 2.03759765625, 2.14349365234375, 2.2493896484375, 2.35528564453125, 2.461181640625, 2.56707763671875, 2.6729736328125, 2.77886962890625, 2.884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 5.0, 13.0, 8.0, 29.0, 47.0, 44.0, 79.0, 94.0, 188.0, 245.0, 372.0, 552.0, 904.0, 1288.0, 2064.0, 3070.0, 4614.0, 6891.0, 10818.0, 16144.0, 25087.0, 37506.0, 56598.0, 83411.0, 116957.0, 223890.0, 1117129.0, 122062.0, 88863.0, 60573.0, 40381.0, 26397.0, 17427.0, 11332.0, 7484.0, 4846.0, 3329.0, 2184.0, 1436.0, 969.0, 578.0, 390.0, 278.0, 189.0, 119.0, 85.0, 63.0, 34.0, 23.0, 23.0, 14.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.34415435791015625, -0.3330841064453125, -0.32201385498046875, -0.310943603515625, -0.29987335205078125, -0.2888031005859375, -0.27773284912109375, -0.26666259765625, -0.25559234619140625, -0.2445220947265625, -0.23345184326171875, -0.222381591796875, -0.21131134033203125, -0.2002410888671875, -0.18917083740234375, -0.1781005859375, -0.16703033447265625, -0.1559600830078125, -0.14488983154296875, -0.133819580078125, -0.12274932861328125, -0.1116790771484375, -0.10060882568359375, -0.08953857421875, -0.07846832275390625, -0.0673980712890625, -0.05632781982421875, -0.045257568359375, -0.03418731689453125, -0.0231170654296875, -0.01204681396484375, -0.0009765625, 0.01009368896484375, 0.0211639404296875, 0.03223419189453125, 0.043304443359375, 0.05437469482421875, 0.0654449462890625, 0.07651519775390625, 0.08758544921875, 0.09865570068359375, 0.1097259521484375, 0.12079620361328125, 0.131866455078125, 0.14293670654296875, 0.1540069580078125, 0.16507720947265625, 0.1761474609375, 0.18721771240234375, 0.1982879638671875, 0.20935821533203125, 0.220428466796875, 0.23149871826171875, 0.2425689697265625, 0.25363922119140625, 0.26470947265625, 0.27577972412109375, 0.2868499755859375, 0.29792022705078125, 0.308990478515625, 0.32006072998046875, 0.3311309814453125, 0.34220123291015625, 0.353271484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 16.0, 19.0, 11.0, 17.0, 12.0, 24.0, 21.0, 25.0, 38.0, 45.0, 53.0, 73.0, 66.0, 66.0, 75.0, 69.0, 66.0, 54.0, 38.0, 35.0, 31.0, 35.0, 16.0, 11.0, 12.0, 14.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003917694091796875, -0.003775477409362793, -0.003633260726928711, -0.003491044044494629, -0.003348827362060547, -0.003206610679626465, -0.003064393997192383, -0.0029221773147583008, -0.0027799606323242188, -0.0026377439498901367, -0.0024955272674560547, -0.0023533105850219727, -0.0022110939025878906, -0.0020688772201538086, -0.0019266605377197266, -0.0017844438552856445, -0.0016422271728515625, -0.0015000104904174805, -0.0013577938079833984, -0.0012155771255493164, -0.0010733604431152344, -0.0009311437606811523, -0.0007889270782470703, -0.0006467103958129883, -0.0005044937133789062, -0.0003622770309448242, -0.0002200603485107422, -7.784366607666016e-05, 6.437301635742188e-05, 0.0002065896987915039, 0.00034880638122558594, 0.000491023063659668, 0.00063323974609375, 0.000775456428527832, 0.0009176731109619141, 0.001059889793395996, 0.0012021064758300781, 0.0013443231582641602, 0.0014865398406982422, 0.0016287565231323242, 0.0017709732055664062, 0.0019131898880004883, 0.0020554065704345703, 0.0021976232528686523, 0.0023398399353027344, 0.0024820566177368164, 0.0026242733001708984, 0.0027664899826049805, 0.0029087066650390625, 0.0030509233474731445, 0.0031931400299072266, 0.0033353567123413086, 0.0034775733947753906, 0.0036197900772094727, 0.0037620067596435547, 0.0039042234420776367, 0.004046440124511719, 0.004188656806945801, 0.004330873489379883, 0.004473090171813965, 0.004615306854248047, 0.004757523536682129, 0.004899740219116211, 0.005041956901550293, 0.005184173583984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 19.0, 18.0, 24.0, 28.0, 47.0, 66.0, 93.0, 136.0, 178.0, 296.0, 521.0, 2716.0, 823777.0, 217757.0, 1543.0, 449.0, 282.0, 157.0, 127.0, 70.0, 55.0, 34.0, 37.0, 25.0, 21.0, 14.0, 14.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.1013631820678711, -0.09853935241699219, -0.09571552276611328, -0.09289169311523438, -0.09006786346435547, -0.08724403381347656, -0.08442020416259766, -0.08159637451171875, -0.07877254486083984, -0.07594871520996094, -0.07312488555908203, -0.07030105590820312, -0.06747722625732422, -0.06465339660644531, -0.061829566955566406, -0.0590057373046875, -0.056181907653808594, -0.05335807800292969, -0.05053424835205078, -0.047710418701171875, -0.04488658905029297, -0.04206275939941406, -0.039238929748535156, -0.03641510009765625, -0.033591270446777344, -0.030767440795898438, -0.02794361114501953, -0.025119781494140625, -0.02229595184326172, -0.019472122192382812, -0.016648292541503906, -0.013824462890625, -0.011000633239746094, -0.008176803588867188, -0.005352973937988281, -0.002529144287109375, 0.00029468536376953125, 0.0031185150146484375, 0.005942344665527344, 0.00876617431640625, 0.011590003967285156, 0.014413833618164062, 0.01723766326904297, 0.020061492919921875, 0.02288532257080078, 0.025709152221679688, 0.028532981872558594, 0.0313568115234375, 0.034180641174316406, 0.03700447082519531, 0.03982830047607422, 0.042652130126953125, 0.04547595977783203, 0.04829978942871094, 0.051123619079589844, 0.05394744873046875, 0.056771278381347656, 0.05959510803222656, 0.06241893768310547, 0.06524276733398438, 0.06806659698486328, 0.07089042663574219, 0.0737142562866211, 0.0765380859375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 850.0, 151.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0566568598151207, -0.05529935285449028, -0.05394184589385986, -0.052584342658519745, -0.05122683569788933, -0.04986932873725891, -0.048511821776628494, -0.04715431481599808, -0.04579680785536766, -0.044439300894737244, -0.04308179393410683, -0.04172428697347641, -0.04036678373813629, -0.039009276777505875, -0.03765176981687546, -0.03629426285624504, -0.034936755895614624, -0.03357924893498421, -0.03222174197435379, -0.030864236876368523, -0.029506729915738106, -0.028149224817752838, -0.02679171785712242, -0.025434210896492004, -0.024076707661151886, -0.02271920070052147, -0.0213616956025362, -0.020004188641905785, -0.018646681681275368, -0.0172891765832901, -0.015931669622659683, -0.014574162662029266, -0.013216657564043999, -0.011859151534736156, -0.01050164457410574, -0.009144138544797897, -0.007786632049828768, -0.006429125554859638, -0.005071619525551796, -0.003714112564921379, -0.002356606535613537, -0.000999100157059729, 0.00035840622149407864, 0.0017159124836325645, 0.003073418978601694, 0.004430925473570824, 0.005788431502878666, 0.007145938463509083, 0.008503444492816925, 0.009860950522124767, 0.011218457482755184, 0.012575963512063026, 0.013933470472693443, 0.015290976502001286, 0.016648482531309128, 0.018005989491939545, 0.01936349645256996, 0.02072100341320038, 0.022078508511185646, 0.023436015471816063, 0.02479352243244648, 0.026151027530431747, 0.027508534491062164, 0.02886604145169258, 0.03022354654967785]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 21.0, 23.0, 19.0, 35.0, 32.0, 34.0, 43.0, 45.0, 45.0, 42.0, 58.0, 37.0, 53.0, 44.0, 42.0, 42.0, 42.0, 42.0, 41.0, 35.0, 33.0, 27.0, 15.0, 23.0, 20.0, 7.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031978487968444824, -0.0031014643609523773, -0.003005079925060272, -0.002908695489168167, -0.002812311053276062, -0.002715926617383957, -0.002619542181491852, -0.0025231577455997467, -0.0024267733097076416, -0.0023303888738155365, -0.0022340044379234314, -0.0021376200020313263, -0.002041235566139221, -0.001944851130247116, -0.001848466694355011, -0.0017520822584629059, -0.0016556978225708008, -0.0015593133866786957, -0.0014629289507865906, -0.0013665445148944855, -0.0012701600790023804, -0.0011737756431102753, -0.0010773912072181702, -0.000981006771326065, -0.00088462233543396, -0.0007882378995418549, -0.0006918534636497498, -0.0005954690277576447, -0.0004990845918655396, -0.00040270015597343445, -0.00030631572008132935, -0.00020993128418922424, -0.00011354684829711914, -1.7162412405014038e-05, 7.922202348709106e-05, 0.00017560645937919617, 0.00027199089527130127, 0.00036837533116340637, 0.0004647597670555115, 0.0005611442029476166, 0.0006575286388397217, 0.0007539130747318268, 0.0008502975106239319, 0.000946681946516037, 0.001043066382408142, 0.0011394508183002472, 0.0012358352541923523, 0.0013322196900844574, 0.0014286041259765625, 0.0015249885618686676, 0.0016213729977607727, 0.0017177574336528778, 0.001814141869544983, 0.001910526305437088, 0.002006910741329193, 0.0021032951772212982, 0.0021996796131134033, 0.0022960640490055084, 0.0023924484848976135, 0.0024888329207897186, 0.0025852173566818237, 0.002681601792573929, 0.002777986228466034, 0.002874370664358139, 0.002970755100250244]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 41.0, 41.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 4.0, 6.0, 13.0, 24.0, 35.0, 33.0, 79.0, 91.0, 129.0, 187.0, 282.0, 410.0, 537.0, 849.0, 1288.0, 1938.0, 3205.0, 5699.0, 11385.0, 26710.0, 78535.0, 295515.0, 427141.0, 123202.0, 38021.0, 15156.0, 7294.0, 3963.0, 2262.0, 1478.0, 935.0, 651.0, 451.0, 357.0, 225.0, 136.0, 97.0, 71.0, 57.0, 29.0, 27.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.91949462890625, -3.7803955078125, -3.64129638671875, -3.502197265625, -3.36309814453125, -3.2239990234375, -3.08489990234375, -2.94580078125, -2.80670166015625, -2.6676025390625, -2.52850341796875, -2.389404296875, -2.25030517578125, -2.1112060546875, -1.97210693359375, -1.8330078125, -1.69390869140625, -1.5548095703125, -1.41571044921875, -1.276611328125, -1.13751220703125, -0.9984130859375, -0.85931396484375, -0.72021484375, -0.58111572265625, -0.4420166015625, -0.30291748046875, -0.163818359375, -0.02471923828125, 0.1143798828125, 0.25347900390625, 0.392578125, 0.53167724609375, 0.6707763671875, 0.80987548828125, 0.948974609375, 1.08807373046875, 1.2271728515625, 1.36627197265625, 1.50537109375, 1.64447021484375, 1.7835693359375, 1.92266845703125, 2.061767578125, 2.20086669921875, 2.3399658203125, 2.47906494140625, 2.6181640625, 2.75726318359375, 2.8963623046875, 3.03546142578125, 3.174560546875, 3.31365966796875, 3.4527587890625, 3.59185791015625, 3.73095703125, 3.87005615234375, 4.0091552734375, 4.14825439453125, 4.287353515625, 4.42645263671875, 4.5655517578125, 4.70465087890625, 4.84375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 14.0, 15.0, 21.0, 26.0, 28.0, 26.0, 35.0, 33.0, 32.0, 37.0, 43.0, 60.0, 105.0, 345.0, 1569.0, 127.0, 72.0, 42.0, 43.0, 28.0, 34.0, 37.0, 32.0, 22.0, 26.0, 17.0, 19.0, 21.0, 14.0, 11.0, 6.0, 11.0, 6.0, 11.0, 3.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.393310546875, -15.84912109375, -15.304931640625, -14.7607421875, -14.216552734375, -13.67236328125, -13.128173828125, -12.583984375, -12.039794921875, -11.49560546875, -10.951416015625, -10.4072265625, -9.863037109375, -9.31884765625, -8.774658203125, -8.23046875, -7.686279296875, -7.14208984375, -6.597900390625, -6.0537109375, -5.509521484375, -4.96533203125, -4.421142578125, -3.876953125, -3.332763671875, -2.78857421875, -2.244384765625, -1.7001953125, -1.156005859375, -0.61181640625, -0.067626953125, 0.4765625, 1.020751953125, 1.56494140625, 2.109130859375, 2.6533203125, 3.197509765625, 3.74169921875, 4.285888671875, 4.830078125, 5.374267578125, 5.91845703125, 6.462646484375, 7.0068359375, 7.551025390625, 8.09521484375, 8.639404296875, 9.18359375, 9.727783203125, 10.27197265625, 10.816162109375, 11.3603515625, 11.904541015625, 12.44873046875, 12.992919921875, 13.537109375, 14.081298828125, 14.62548828125, 15.169677734375, 15.7138671875, 16.258056640625, 16.80224609375, 17.346435546875, 17.890625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 6.0, 11.0, 12.0, 7.0, 9.0, 19.0, 14.0, 21.0, 35.0, 25.0, 42.0, 55.0, 85.0, 97.0, 107.0, 167.0, 218.0, 376.0, 1278.0, 17145.0, 3054831.0, 67267.0, 2312.0, 523.0, 286.0, 185.0, 118.0, 92.0, 76.0, 52.0, 45.0, 34.0, 25.0, 20.0, 22.0, 10.0, 8.0, 10.0, 5.0, 8.0, 6.0, 8.0, 10.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.84375, -34.74609375, -33.6484375, -32.55078125, -31.453125, -30.35546875, -29.2578125, -28.16015625, -27.0625, -25.96484375, -24.8671875, -23.76953125, -22.671875, -21.57421875, -20.4765625, -19.37890625, -18.28125, -17.18359375, -16.0859375, -14.98828125, -13.890625, -12.79296875, -11.6953125, -10.59765625, -9.5, -8.40234375, -7.3046875, -6.20703125, -5.109375, -4.01171875, -2.9140625, -1.81640625, -0.71875, 0.37890625, 1.4765625, 2.57421875, 3.671875, 4.76953125, 5.8671875, 6.96484375, 8.0625, 9.16015625, 10.2578125, 11.35546875, 12.453125, 13.55078125, 14.6484375, 15.74609375, 16.84375, 17.94140625, 19.0390625, 20.13671875, 21.234375, 22.33203125, 23.4296875, 24.52734375, 25.625, 26.72265625, 27.8203125, 28.91796875, 30.015625, 31.11328125, 32.2109375, 33.30859375, 34.40625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [37.0, 929.0, 49.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.242090225219727, -3.6338396072387695, 2.9744110107421875, 9.582662582397461, 16.1909122467041, 22.799161911010742, 29.40741539001465, 36.015663146972656, 42.62391662597656, 49.2321662902832, 55.840415954589844, 62.44866943359375, 69.05691528320312, 75.66516876220703, 82.27342224121094, 88.88166809082031, 95.48992156982422, 102.09817504882812, 108.7064208984375, 115.3146743774414, 121.92292785644531, 128.5311737060547, 135.13943481445312, 141.7476806640625, 148.35592651367188, 154.96417236328125, 161.5724334716797, 168.18067932128906, 174.78892517089844, 181.39718627929688, 188.00543212890625, 194.61367797851562, 201.221923828125, 207.83016967773438, 214.4384307861328, 221.0466766357422, 227.65492248535156, 234.26318359375, 240.87142944335938, 247.47967529296875, 254.08792114257812, 260.6961669921875, 267.3044128417969, 273.91265869140625, 280.52093505859375, 287.1291809082031, 293.7374267578125, 300.3456726074219, 306.95391845703125, 313.5621643066406, 320.17041015625, 326.7786865234375, 333.3869323730469, 339.99517822265625, 346.6034240722656, 353.211669921875, 359.8199462890625, 366.4281921386719, 373.03643798828125, 379.64471435546875, 386.2529602050781, 392.8612060546875, 399.4694519042969, 406.07769775390625, 412.6859436035156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 9.0, 5.0, 11.0, 7.0, 18.0, 17.0, 21.0, 22.0, 20.0, 17.0, 25.0, 36.0, 38.0, 27.0, 37.0, 45.0, 43.0, 28.0, 37.0, 43.0, 47.0, 35.0, 35.0, 28.0, 36.0, 44.0, 39.0, 31.0, 26.0, 26.0, 24.0, 17.0, 22.0, 15.0, 13.0, 7.0, 10.0, 5.0, 9.0, 5.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-51.54712677001953, -50.032745361328125, -48.51836013793945, -47.00397872924805, -45.489593505859375, -43.97521209716797, -42.46083068847656, -40.94644546508789, -39.43206024169922, -37.91767883300781, -36.40329360961914, -34.888912200927734, -33.37452697753906, -31.860145568847656, -30.345762252807617, -28.831378936767578, -27.316997528076172, -25.802614212036133, -24.288230895996094, -22.773849487304688, -21.259464263916016, -19.74508285522461, -18.23069953918457, -16.71631622314453, -15.201932907104492, -13.687549591064453, -12.173166275024414, -10.658783912658691, -9.144400596618652, -7.630017280578613, -6.115634918212891, -4.601251602172852, -3.0868682861328125, -1.5724852085113525, -0.05810213088989258, 1.4562807083129883, 2.9706640243530273, 4.485047340393066, 5.999429702758789, 7.513813018798828, 9.028196334838867, 10.542579650878906, 12.056962966918945, 13.571345329284668, 15.085728645324707, 16.600112915039062, 18.11449432373047, 19.628877639770508, 21.143260955810547, 22.657644271850586, 24.172027587890625, 25.68640899658203, 27.200794219970703, 28.71517562866211, 30.22955894470215, 31.743942260742188, 33.258323669433594, 34.772705078125, 36.28709030151367, 37.80147171020508, 39.31585693359375, 40.830238342285156, 42.34461975097656, 43.859004974365234, 45.373390197753906]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 8.0, 8.0, 7.0, 8.0, 12.0, 21.0, 24.0, 18.0, 25.0, 27.0, 34.0, 40.0, 39.0, 33.0, 39.0, 53.0, 41.0, 43.0, 34.0, 40.0, 36.0, 37.0, 42.0, 27.0, 46.0, 29.0, 27.0, 20.0, 33.0, 25.0, 19.0, 20.0, 16.0, 12.0, 7.0, 8.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.9609375, -5.78814697265625, -5.6153564453125, -5.44256591796875, -5.269775390625, -5.09698486328125, -4.9241943359375, -4.75140380859375, -4.57861328125, -4.40582275390625, -4.2330322265625, -4.06024169921875, -3.887451171875, -3.71466064453125, -3.5418701171875, -3.36907958984375, -3.1962890625, -3.02349853515625, -2.8507080078125, -2.67791748046875, -2.505126953125, -2.33233642578125, -2.1595458984375, -1.98675537109375, -1.81396484375, -1.64117431640625, -1.4683837890625, -1.29559326171875, -1.122802734375, -0.95001220703125, -0.7772216796875, -0.60443115234375, -0.431640625, -0.25885009765625, -0.0860595703125, 0.08673095703125, 0.259521484375, 0.43231201171875, 0.6051025390625, 0.77789306640625, 0.95068359375, 1.12347412109375, 1.2962646484375, 1.46905517578125, 1.641845703125, 1.81463623046875, 1.9874267578125, 2.16021728515625, 2.3330078125, 2.50579833984375, 2.6785888671875, 2.85137939453125, 3.024169921875, 3.19696044921875, 3.3697509765625, 3.54254150390625, 3.71533203125, 3.88812255859375, 4.0609130859375, 4.23370361328125, 4.406494140625, 4.57928466796875, 4.7520751953125, 4.92486572265625, 5.09765625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 11.0, 16.0, 21.0, 13.0, 21.0, 29.0, 29.0, 45.0, 52.0, 67.0, 96.0, 159.0, 369.0, 2157.0, 26198.0, 1786726.0, 2340829.0, 34047.0, 2370.0, 402.0, 133.0, 107.0, 72.0, 50.0, 46.0, 26.0, 26.0, 28.0, 16.0, 19.0, 14.0, 11.0, 10.0, 8.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-30.796875, -29.9423828125, -29.087890625, -28.2333984375, -27.37890625, -26.5244140625, -25.669921875, -24.8154296875, -23.9609375, -23.1064453125, -22.251953125, -21.3974609375, -20.54296875, -19.6884765625, -18.833984375, -17.9794921875, -17.125, -16.2705078125, -15.416015625, -14.5615234375, -13.70703125, -12.8525390625, -11.998046875, -11.1435546875, -10.2890625, -9.4345703125, -8.580078125, -7.7255859375, -6.87109375, -6.0166015625, -5.162109375, -4.3076171875, -3.453125, -2.5986328125, -1.744140625, -0.8896484375, -0.03515625, 0.8193359375, 1.673828125, 2.5283203125, 3.3828125, 4.2373046875, 5.091796875, 5.9462890625, 6.80078125, 7.6552734375, 8.509765625, 9.3642578125, 10.21875, 11.0732421875, 11.927734375, 12.7822265625, 13.63671875, 14.4912109375, 15.345703125, 16.2001953125, 17.0546875, 17.9091796875, 18.763671875, 19.6181640625, 20.47265625, 21.3271484375, 22.181640625, 23.0361328125, 23.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 12.0, 8.0, 18.0, 23.0, 37.0, 42.0, 54.0, 91.0, 134.0, 161.0, 226.0, 327.0, 405.0, 513.0, 489.0, 427.0, 330.0, 229.0, 155.0, 131.0, 82.0, 59.0, 28.0, 31.0, 14.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.924072265625, -11.49658203125, -11.069091796875, -10.6416015625, -10.214111328125, -9.78662109375, -9.359130859375, -8.931640625, -8.504150390625, -8.07666015625, -7.649169921875, -7.2216796875, -6.794189453125, -6.36669921875, -5.939208984375, -5.51171875, -5.084228515625, -4.65673828125, -4.229248046875, -3.8017578125, -3.374267578125, -2.94677734375, -2.519287109375, -2.091796875, -1.664306640625, -1.23681640625, -0.809326171875, -0.3818359375, 0.045654296875, 0.47314453125, 0.900634765625, 1.328125, 1.755615234375, 2.18310546875, 2.610595703125, 3.0380859375, 3.465576171875, 3.89306640625, 4.320556640625, 4.748046875, 5.175537109375, 5.60302734375, 6.030517578125, 6.4580078125, 6.885498046875, 7.31298828125, 7.740478515625, 8.16796875, 8.595458984375, 9.02294921875, 9.450439453125, 9.8779296875, 10.305419921875, 10.73291015625, 11.160400390625, 11.587890625, 12.015380859375, 12.44287109375, 12.870361328125, 13.2978515625, 13.725341796875, 14.15283203125, 14.580322265625, 15.0078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 12.0, 13.0, 12.0, 21.0, 31.0, 42.0, 54.0, 62.0, 98.0, 139.0, 186.0, 296.0, 547.0, 1692.0, 21048.0, 1729504.0, 2410485.0, 26489.0, 1977.0, 526.0, 315.0, 188.0, 132.0, 104.0, 83.0, 56.0, 45.0, 18.0, 26.0, 16.0, 20.0, 6.0, 8.0, 11.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.53125, -41.20361328125, -39.8759765625, -38.54833984375, -37.220703125, -35.89306640625, -34.5654296875, -33.23779296875, -31.91015625, -30.58251953125, -29.2548828125, -27.92724609375, -26.599609375, -25.27197265625, -23.9443359375, -22.61669921875, -21.2890625, -19.96142578125, -18.6337890625, -17.30615234375, -15.978515625, -14.65087890625, -13.3232421875, -11.99560546875, -10.66796875, -9.34033203125, -8.0126953125, -6.68505859375, -5.357421875, -4.02978515625, -2.7021484375, -1.37451171875, -0.046875, 1.28076171875, 2.6083984375, 3.93603515625, 5.263671875, 6.59130859375, 7.9189453125, 9.24658203125, 10.57421875, 11.90185546875, 13.2294921875, 14.55712890625, 15.884765625, 17.21240234375, 18.5400390625, 19.86767578125, 21.1953125, 22.52294921875, 23.8505859375, 25.17822265625, 26.505859375, 27.83349609375, 29.1611328125, 30.48876953125, 31.81640625, 33.14404296875, 34.4716796875, 35.79931640625, 37.126953125, 38.45458984375, 39.7822265625, 41.10986328125, 42.4375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 26.0, 67.0, 90.0, 142.0, 225.0, 167.0, 140.0, 71.0, 45.0, 17.0, 8.0, 1.0, 3.0], "bins": [-175.13687133789062, -171.99627685546875, -168.85569763183594, -165.71511840820312, -162.57452392578125, -159.43392944335938, -156.29335021972656, -153.15277099609375, -150.01217651367188, -146.87158203125, -143.7310028076172, -140.59042358398438, -137.4498291015625, -134.30923461914062, -131.1686553955078, -128.028076171875, -124.88748168945312, -121.74689483642578, -118.60630798339844, -115.4657211303711, -112.32513427734375, -109.1845474243164, -106.04396057128906, -102.90337371826172, -99.76278686523438, -96.62220001220703, -93.48161315917969, -90.34102630615234, -87.200439453125, -84.05985260009766, -80.91926574707031, -77.77867889404297, -74.63809204101562, -71.49750518798828, -68.35691833496094, -65.2163314819336, -62.07574462890625, -58.935157775878906, -55.79457092285156, -52.65398406982422, -49.513397216796875, -46.37281036376953, -43.23222351074219, -40.091636657714844, -36.9510498046875, -33.810462951660156, -30.669876098632812, -27.52928924560547, -24.388702392578125, -21.24811553955078, -18.107528686523438, -14.966941833496094, -11.82635498046875, -8.685768127441406, -5.5451812744140625, -2.4045944213867188, 0.735992431640625, 3.8765792846679688, 7.0171661376953125, 10.157752990722656, 13.29833984375, 16.438926696777344, 19.579513549804688, 22.72010040283203, 25.860687255859375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 10.0, 1.0, 12.0, 15.0, 6.0, 11.0, 10.0, 18.0, 21.0, 25.0, 21.0, 29.0, 28.0, 27.0, 26.0, 25.0, 37.0, 51.0, 31.0, 43.0, 27.0, 50.0, 39.0, 37.0, 36.0, 36.0, 34.0, 35.0, 28.0, 27.0, 30.0, 21.0, 18.0, 24.0, 24.0, 19.0, 15.0, 11.0, 5.0, 4.0, 5.0, 8.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.52217102050781, -34.38365936279297, -33.245147705078125, -32.10663604736328, -30.968124389648438, -29.829612731933594, -28.691099166870117, -27.552587509155273, -26.41407585144043, -25.275564193725586, -24.137052536010742, -22.9985408782959, -21.860027313232422, -20.721515655517578, -19.583003997802734, -18.44449234008789, -17.305980682373047, -16.167469024658203, -15.02895736694336, -13.8904447555542, -12.751933097839355, -11.613421440124512, -10.474908828735352, -9.336397171020508, -8.197885513305664, -7.05937385559082, -5.920861721038818, -4.782349586486816, -3.6438379287719727, -2.505326271057129, -1.366814136505127, -0.228302001953125, 0.9102096557617188, 2.0487215518951416, 3.1872334480285645, 4.325745582580566, 5.46425724029541, 6.602768898010254, 7.741281032562256, 8.879793167114258, 10.018304824829102, 11.156816482543945, 12.295328140258789, 13.43384075164795, 14.572352409362793, 15.710864067077637, 16.849376678466797, 17.98788833618164, 19.126399993896484, 20.264911651611328, 21.403423309326172, 22.541934967041016, 23.68044662475586, 24.818958282470703, 25.95747184753418, 27.095983505249023, 28.234495162963867, 29.37300682067871, 30.511518478393555, 31.6500301361084, 32.788543701171875, 33.92705535888672, 35.06556701660156, 36.204078674316406, 37.34259033203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 33.0, 45.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 5.0, 17.0, 39.0, 34.0, 78.0, 118.0, 198.0, 333.0, 597.0, 936.0, 1558.0, 2614.0, 4113.0, 7081.0, 11535.0, 19185.0, 33461.0, 57909.0, 100157.0, 161772.0, 208330.0, 173416.0, 110378.0, 64576.0, 36757.0, 21404.0, 12731.0, 7497.0, 4664.0, 2830.0, 1668.0, 984.0, 656.0, 358.0, 213.0, 138.0, 69.0, 59.0, 37.0, 19.0, 12.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6212921142578125, -0.600982666015625, -0.5806732177734375, -0.56036376953125, -0.5400543212890625, -0.519744873046875, -0.4994354248046875, -0.4791259765625, -0.4588165283203125, -0.438507080078125, -0.4181976318359375, -0.39788818359375, -0.3775787353515625, -0.357269287109375, -0.3369598388671875, -0.316650390625, -0.2963409423828125, -0.276031494140625, -0.2557220458984375, -0.23541259765625, -0.2151031494140625, -0.194793701171875, -0.1744842529296875, -0.1541748046875, -0.1338653564453125, -0.113555908203125, -0.0932464599609375, -0.07293701171875, -0.0526275634765625, -0.032318115234375, -0.0120086669921875, 0.00830078125, 0.0286102294921875, 0.048919677734375, 0.0692291259765625, 0.08953857421875, 0.1098480224609375, 0.130157470703125, 0.1504669189453125, 0.1707763671875, 0.1910858154296875, 0.211395263671875, 0.2317047119140625, 0.25201416015625, 0.2723236083984375, 0.292633056640625, 0.3129425048828125, 0.333251953125, 0.3535614013671875, 0.373870849609375, 0.3941802978515625, 0.41448974609375, 0.4347991943359375, 0.455108642578125, 0.4754180908203125, 0.4957275390625, 0.5160369873046875, 0.536346435546875, 0.5566558837890625, 0.57696533203125, 0.5972747802734375, 0.617584228515625, 0.6378936767578125, 0.658203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 23.0, 15.0, 18.0, 18.0, 27.0, 25.0, 32.0, 17.0, 38.0, 36.0, 34.0, 32.0, 42.0, 23.0, 39.0, 1063.0, 38.0, 29.0, 51.0, 34.0, 35.0, 33.0, 31.0, 31.0, 30.0, 26.0, 24.0, 28.0, 8.0, 14.0, 16.0, 12.0, 12.0, 4.0, 13.0, 8.0, 6.0, 4.0, 1.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3671875, -3.26776123046875, -3.1683349609375, -3.06890869140625, -2.969482421875, -2.87005615234375, -2.7706298828125, -2.67120361328125, -2.57177734375, -2.47235107421875, -2.3729248046875, -2.27349853515625, -2.174072265625, -2.07464599609375, -1.9752197265625, -1.87579345703125, -1.7763671875, -1.67694091796875, -1.5775146484375, -1.47808837890625, -1.378662109375, -1.27923583984375, -1.1798095703125, -1.08038330078125, -0.98095703125, -0.88153076171875, -0.7821044921875, -0.68267822265625, -0.583251953125, -0.48382568359375, -0.3843994140625, -0.28497314453125, -0.185546875, -0.08612060546875, 0.0133056640625, 0.11273193359375, 0.212158203125, 0.31158447265625, 0.4110107421875, 0.51043701171875, 0.60986328125, 0.70928955078125, 0.8087158203125, 0.90814208984375, 1.007568359375, 1.10699462890625, 1.2064208984375, 1.30584716796875, 1.4052734375, 1.50469970703125, 1.6041259765625, 1.70355224609375, 1.802978515625, 1.90240478515625, 2.0018310546875, 2.10125732421875, 2.20068359375, 2.30010986328125, 2.3995361328125, 2.49896240234375, 2.598388671875, 2.69781494140625, 2.7972412109375, 2.89666748046875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 8.0, 2.0, 8.0, 13.0, 19.0, 34.0, 40.0, 67.0, 112.0, 182.0, 332.0, 508.0, 807.0, 1373.0, 2168.0, 3775.0, 5909.0, 9830.0, 16190.0, 26735.0, 43580.0, 70906.0, 110714.0, 155703.0, 1224796.0, 149971.0, 103778.0, 65905.0, 40903.0, 24510.0, 14910.0, 8999.0, 5554.0, 3455.0, 2085.0, 1244.0, 755.0, 479.0, 289.0, 182.0, 114.0, 72.0, 44.0, 27.0, 15.0, 12.0, 9.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4067955017089844, -0.39342498779296875, -0.3800544738769531, -0.3666839599609375, -0.3533134460449219, -0.33994293212890625, -0.3265724182128906, -0.313201904296875, -0.2998313903808594, -0.28646087646484375, -0.2730903625488281, -0.2597198486328125, -0.24634933471679688, -0.23297882080078125, -0.21960830688476562, -0.20623779296875, -0.19286727905273438, -0.17949676513671875, -0.16612625122070312, -0.1527557373046875, -0.13938522338867188, -0.12601470947265625, -0.11264419555664062, -0.099273681640625, -0.08590316772460938, -0.07253265380859375, -0.059162139892578125, -0.0457916259765625, -0.032421112060546875, -0.01905059814453125, -0.005680084228515625, 0.0076904296875, 0.021060943603515625, 0.03443145751953125, 0.047801971435546875, 0.0611724853515625, 0.07454299926757812, 0.08791351318359375, 0.10128402709960938, 0.114654541015625, 0.12802505493164062, 0.14139556884765625, 0.15476608276367188, 0.1681365966796875, 0.18150711059570312, 0.19487762451171875, 0.20824813842773438, 0.22161865234375, 0.23498916625976562, 0.24835968017578125, 0.2617301940917969, 0.2751007080078125, 0.2884712219238281, 0.30184173583984375, 0.3152122497558594, 0.328582763671875, 0.3419532775878906, 0.35532379150390625, 0.3686943054199219, 0.3820648193359375, 0.3954353332519531, 0.40880584716796875, 0.4221763610839844, 0.435546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 10.0, 11.0, 12.0, 19.0, 24.0, 29.0, 28.0, 46.0, 47.0, 50.0, 52.0, 64.0, 86.0, 74.0, 67.0, 52.0, 56.0, 35.0, 31.0, 25.0, 24.0, 27.0, 15.0, 15.0, 12.0, 7.0, 7.0, 5.0, 4.0, 6.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.005229949951171875, -0.005082249641418457, -0.004934549331665039, -0.004786849021911621, -0.004639148712158203, -0.004491448402404785, -0.004343748092651367, -0.004196047782897949, -0.004048347473144531, -0.0039006471633911133, -0.0037529468536376953, -0.0036052465438842773, -0.0034575462341308594, -0.0033098459243774414, -0.0031621456146240234, -0.0030144453048706055, -0.0028667449951171875, -0.0027190446853637695, -0.0025713443756103516, -0.0024236440658569336, -0.0022759437561035156, -0.0021282434463500977, -0.0019805431365966797, -0.0018328428268432617, -0.0016851425170898438, -0.0015374422073364258, -0.0013897418975830078, -0.0012420415878295898, -0.0010943412780761719, -0.0009466409683227539, -0.0007989406585693359, -0.000651240348815918, -0.0005035400390625, -0.00035583972930908203, -0.00020813941955566406, -6.0439109802246094e-05, 8.726119995117188e-05, 0.00023496150970458984, 0.0003826618194580078, 0.0005303621292114258, 0.0006780624389648438, 0.0008257627487182617, 0.0009734630584716797, 0.0011211633682250977, 0.0012688636779785156, 0.0014165639877319336, 0.0015642642974853516, 0.0017119646072387695, 0.0018596649169921875, 0.0020073652267456055, 0.0021550655364990234, 0.0023027658462524414, 0.0024504661560058594, 0.0025981664657592773, 0.0027458667755126953, 0.0028935670852661133, 0.0030412673950195312, 0.0031889677047729492, 0.003336668014526367, 0.003484368324279785, 0.003632068634033203, 0.003779768943786621, 0.003927469253540039, 0.004075169563293457, 0.004222869873046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 2.0, 6.0, 10.0, 6.0, 3.0, 4.0, 11.0, 21.0, 29.0, 38.0, 55.0, 63.0, 71.0, 105.0, 182.0, 289.0, 599.0, 4284.0, 990878.0, 49860.0, 895.0, 413.0, 225.0, 143.0, 99.0, 70.0, 49.0, 35.0, 18.0, 18.0, 14.0, 4.0, 6.0, 6.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08699798583984375, -0.0839691162109375, -0.08094024658203125, -0.077911376953125, -0.07488250732421875, -0.0718536376953125, -0.06882476806640625, -0.0657958984375, -0.06276702880859375, -0.0597381591796875, -0.05670928955078125, -0.053680419921875, -0.05065155029296875, -0.0476226806640625, -0.04459381103515625, -0.04156494140625, -0.03853607177734375, -0.0355072021484375, -0.03247833251953125, -0.029449462890625, -0.02642059326171875, -0.0233917236328125, -0.02036285400390625, -0.017333984375, -0.01430511474609375, -0.0112762451171875, -0.00824737548828125, -0.005218505859375, -0.00218963623046875, 0.0008392333984375, 0.00386810302734375, 0.00689697265625, 0.00992584228515625, 0.0129547119140625, 0.01598358154296875, 0.019012451171875, 0.02204132080078125, 0.0250701904296875, 0.02809906005859375, 0.0311279296875, 0.03415679931640625, 0.0371856689453125, 0.04021453857421875, 0.043243408203125, 0.04627227783203125, 0.0493011474609375, 0.05233001708984375, 0.05535888671875, 0.05838775634765625, 0.0614166259765625, 0.06444549560546875, 0.067474365234375, 0.07050323486328125, 0.0735321044921875, 0.07656097412109375, 0.07958984375, 0.08261871337890625, 0.0856475830078125, 0.08867645263671875, 0.091705322265625, 0.09473419189453125, 0.0977630615234375, 0.10079193115234375, 0.10382080078125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 165.0, 762.0, 71.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00869666412472725, -0.007854385301470757, -0.007012106012552977, -0.006169827189296484, -0.005327547900378704, -0.0044852690771222115, -0.003642990253865719, -0.002800710964947939, -0.0019584321416914463, -0.00111615308560431, -0.0002738741459324956, 0.0005684047937393188, 0.0014106838498264551, 0.0022529629059135914, 0.003095241729170084, 0.003937521018087864, 0.0047797998413443565, 0.005622078664600849, 0.006464357953518629, 0.007306636776775122, 0.008148916065692902, 0.008991194888949394, 0.009833473712205887, 0.01067575253546238, 0.011518031358718872, 0.012360310181975365, 0.013202589005231857, 0.01404486782848835, 0.014887147583067417, 0.015729427337646484, 0.016571704298257828, 0.01741398498415947, 0.018256263807415962, 0.019098542630672455, 0.019940821453928947, 0.02078310027718544, 0.021625379100441933, 0.022467657923698425, 0.023309938609600067, 0.02415221743285656, 0.024994496256113052, 0.025836775079369545, 0.026679053902626038, 0.02752133272588253, 0.028363611549139023, 0.029205892235040665, 0.030048169195652008, 0.03089044988155365, 0.03173272684216499, 0.032575007528066635, 0.03341728448867798, 0.03425956517457962, 0.035101842135190964, 0.035944122821092606, 0.03678639978170395, 0.03762868046760559, 0.03847096115350723, 0.039313241839408875, 0.04015551880002022, 0.04099779948592186, 0.0418400764465332, 0.042682357132434845, 0.04352463409304619, 0.04436691477894783, 0.045209191739559174]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 15.0, 23.0, 19.0, 32.0, 42.0, 43.0, 42.0, 53.0, 51.0, 64.0, 52.0, 47.0, 51.0, 56.0, 64.0, 36.0, 55.0, 41.0, 38.0, 25.0, 34.0, 21.0, 18.0, 12.0, 13.0, 7.0, 8.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004752993583679199, -0.004619834013283253, -0.004486674442887306, -0.00435351487249136, -0.004220355302095413, -0.004087195731699467, -0.00395403616130352, -0.0038208765909075737, -0.003687717020511627, -0.0035545574501156807, -0.003421397879719734, -0.0032882383093237877, -0.003155078738927841, -0.0030219191685318947, -0.002888759598135948, -0.0027556000277400017, -0.002622440457344055, -0.0024892808869481087, -0.002356121316552162, -0.0022229617461562157, -0.002089802175760269, -0.0019566426053643227, -0.0018234830349683762, -0.0016903234645724297, -0.0015571638941764832, -0.0014240043237805367, -0.0012908447533845901, -0.0011576851829886436, -0.0010245256125926971, -0.0008913660421967506, -0.0007582064718008041, -0.0006250469014048576, -0.0004918873310089111, -0.00035872776061296463, -0.00022556819021701813, -9.240861982107162e-05, 4.075095057487488e-05, 0.00017391052097082138, 0.0003070700913667679, 0.0004402296617627144, 0.0005733892321586609, 0.0007065488025546074, 0.0008397083729505539, 0.0009728679433465004, 0.001106027513742447, 0.0012391870841383934, 0.00137234665453434, 0.0015055062249302864, 0.001638665795326233, 0.0017718253657221794, 0.001904984936118126, 0.0020381445065140724, 0.002171304076910019, 0.0023044636473059654, 0.002437623217701912, 0.0025707827880978584, 0.002703942358493805, 0.0028371019288897514, 0.002970261499285698, 0.0031034210696816444, 0.003236580640077591, 0.0033697402104735374, 0.003502899780869484, 0.0036360593512654305, 0.003769218921661377]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 34.0, 44.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 2.0, 9.0, 11.0, 21.0, 37.0, 38.0, 54.0, 104.0, 178.0, 280.0, 424.0, 625.0, 1100.0, 1748.0, 2775.0, 4643.0, 8018.0, 13800.0, 25276.0, 52256.0, 147238.0, 443603.0, 209615.0, 66886.0, 30397.0, 16296.0, 9358.0, 5364.0, 3232.0, 1940.0, 1187.0, 749.0, 435.0, 314.0, 188.0, 127.0, 69.0, 48.0, 37.0, 29.0, 23.0, 13.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.4669189453125, -3.353759765625, -3.2406005859375, -3.12744140625, -3.0142822265625, -2.901123046875, -2.7879638671875, -2.6748046875, -2.5616455078125, -2.448486328125, -2.3353271484375, -2.22216796875, -2.1090087890625, -1.995849609375, -1.8826904296875, -1.76953125, -1.6563720703125, -1.543212890625, -1.4300537109375, -1.31689453125, -1.2037353515625, -1.090576171875, -0.9774169921875, -0.8642578125, -0.7510986328125, -0.637939453125, -0.5247802734375, -0.41162109375, -0.2984619140625, -0.185302734375, -0.0721435546875, 0.041015625, 0.1541748046875, 0.267333984375, 0.3804931640625, 0.49365234375, 0.6068115234375, 0.719970703125, 0.8331298828125, 0.9462890625, 1.0594482421875, 1.172607421875, 1.2857666015625, 1.39892578125, 1.5120849609375, 1.625244140625, 1.7384033203125, 1.8515625, 1.9647216796875, 2.077880859375, 2.1910400390625, 2.30419921875, 2.4173583984375, 2.530517578125, 2.6436767578125, 2.7568359375, 2.8699951171875, 2.983154296875, 3.0963134765625, 3.20947265625, 3.3226318359375, 3.435791015625, 3.5489501953125, 3.662109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 19.0, 12.0, 18.0, 29.0, 29.0, 32.0, 29.0, 33.0, 49.0, 46.0, 64.0, 129.0, 1681.0, 304.0, 95.0, 58.0, 40.0, 46.0, 46.0, 32.0, 34.0, 29.0, 24.0, 31.0, 19.0, 17.0, 9.0, 16.0, 8.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.674560546875, -16.98974609375, -16.304931640625, -15.6201171875, -14.935302734375, -14.25048828125, -13.565673828125, -12.880859375, -12.196044921875, -11.51123046875, -10.826416015625, -10.1416015625, -9.456787109375, -8.77197265625, -8.087158203125, -7.40234375, -6.717529296875, -6.03271484375, -5.347900390625, -4.6630859375, -3.978271484375, -3.29345703125, -2.608642578125, -1.923828125, -1.239013671875, -0.55419921875, 0.130615234375, 0.8154296875, 1.500244140625, 2.18505859375, 2.869873046875, 3.5546875, 4.239501953125, 4.92431640625, 5.609130859375, 6.2939453125, 6.978759765625, 7.66357421875, 8.348388671875, 9.033203125, 9.718017578125, 10.40283203125, 11.087646484375, 11.7724609375, 12.457275390625, 13.14208984375, 13.826904296875, 14.51171875, 15.196533203125, 15.88134765625, 16.566162109375, 17.2509765625, 17.935791015625, 18.62060546875, 19.305419921875, 19.990234375, 20.675048828125, 21.35986328125, 22.044677734375, 22.7294921875, 23.414306640625, 24.09912109375, 24.783935546875, 25.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 12.0, 17.0, 18.0, 26.0, 43.0, 49.0, 63.0, 87.0, 108.0, 218.0, 401.0, 1089.0, 19032.0, 3106433.0, 16107.0, 973.0, 377.0, 210.0, 120.0, 85.0, 49.0, 37.0, 32.0, 23.0, 19.0, 18.0, 13.0, 9.0, 6.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.1875, -65.39501953125, -63.6025390625, -61.81005859375, -60.017578125, -58.22509765625, -56.4326171875, -54.64013671875, -52.84765625, -51.05517578125, -49.2626953125, -47.47021484375, -45.677734375, -43.88525390625, -42.0927734375, -40.30029296875, -38.5078125, -36.71533203125, -34.9228515625, -33.13037109375, -31.337890625, -29.54541015625, -27.7529296875, -25.96044921875, -24.16796875, -22.37548828125, -20.5830078125, -18.79052734375, -16.998046875, -15.20556640625, -13.4130859375, -11.62060546875, -9.828125, -8.03564453125, -6.2431640625, -4.45068359375, -2.658203125, -0.86572265625, 0.9267578125, 2.71923828125, 4.51171875, 6.30419921875, 8.0966796875, 9.88916015625, 11.681640625, 13.47412109375, 15.2666015625, 17.05908203125, 18.8515625, 20.64404296875, 22.4365234375, 24.22900390625, 26.021484375, 27.81396484375, 29.6064453125, 31.39892578125, 33.19140625, 34.98388671875, 36.7763671875, 38.56884765625, 40.361328125, 42.15380859375, 43.9462890625, 45.73876953125, 47.53125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 14.0, 35.0, 59.0, 101.0, 152.0, 187.0, 168.0, 145.0, 75.0, 40.0, 22.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.403079986572266, -46.38817596435547, -45.373268127441406, -44.35836410522461, -43.34346008300781, -42.32855224609375, -41.31364822387695, -40.298744201660156, -39.283836364746094, -38.2689323425293, -37.254024505615234, -36.23912048339844, -35.22421646118164, -34.209312438964844, -33.19440460205078, -32.179500579833984, -31.164596557617188, -30.149690628051758, -29.13478660583496, -28.11988067626953, -27.104976654052734, -26.090070724487305, -25.075164794921875, -24.060260772705078, -23.04535484313965, -22.03044891357422, -21.015544891357422, -20.000638961791992, -18.985733032226562, -17.970829010009766, -16.955923080444336, -15.941018104553223, -14.926109313964844, -13.91120433807373, -12.896299362182617, -11.881393432617188, -10.866488456726074, -9.851583480834961, -8.836677551269531, -7.821772575378418, -6.806867599487305, -5.791962623596191, -4.77705717086792, -3.7621519565582275, -2.747246742248535, -1.7323417663574219, -0.7174363136291504, 0.2974691390991211, 1.3123741149902344, 2.3272793292999268, 3.342184543609619, 4.357089996337891, 5.371994972229004, 6.386899948120117, 7.401805400848389, 8.41671085357666, 9.431615829467773, 10.446520805358887, 11.46142578125, 12.47633171081543, 13.491236686706543, 14.506141662597656, 15.521047592163086, 16.535953521728516, 17.550857543945312]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 4.0, 11.0, 6.0, 18.0, 15.0, 16.0, 24.0, 20.0, 25.0, 25.0, 25.0, 34.0, 40.0, 35.0, 35.0, 45.0, 24.0, 46.0, 43.0, 40.0, 36.0, 55.0, 29.0, 47.0, 35.0, 34.0, 27.0, 27.0, 21.0, 32.0, 16.0, 17.0, 8.0, 17.0, 15.0, 9.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.996826171875, -48.29018783569336, -46.58354568481445, -44.87690734863281, -43.170265197753906, -41.463626861572266, -39.756988525390625, -38.05034637451172, -36.34370803833008, -34.63706970214844, -32.93042755126953, -31.22378921508789, -29.517148971557617, -27.810508728027344, -26.10386848449707, -24.397228240966797, -22.690587997436523, -20.98394775390625, -19.277307510375977, -17.570667266845703, -15.864028930664062, -14.157388687133789, -12.450748443603516, -10.744109153747559, -9.037468910217285, -7.33082914352417, -5.624189376831055, -3.9175491333007812, -2.210909366607666, -0.5042695999145508, 1.2023706436157227, 2.9090099334716797, 4.615650177001953, 6.322289943695068, 8.028929710388184, 9.735569953918457, 11.442209243774414, 13.148849487304688, 14.855489730834961, 16.562129974365234, 18.268768310546875, 19.97540855407715, 21.682048797607422, 23.388687133789062, 25.095327377319336, 26.80196762084961, 28.508607864379883, 30.215248107910156, 31.92188835144043, 33.6285285949707, 35.335166931152344, 37.04180908203125, 38.74844741821289, 40.45508575439453, 42.16172790527344, 43.86836624145508, 45.575008392333984, 47.281646728515625, 48.98828887939453, 50.69492721557617, 52.40156936645508, 54.10820770263672, 55.814849853515625, 57.521488189697266, 59.228126525878906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 10.0, 7.0, 8.0, 11.0, 16.0, 9.0, 15.0, 20.0, 26.0, 41.0, 30.0, 34.0, 33.0, 26.0, 23.0, 32.0, 35.0, 33.0, 49.0, 39.0, 39.0, 38.0, 27.0, 36.0, 32.0, 32.0, 35.0, 26.0, 28.0, 23.0, 20.0, 25.0, 18.0, 9.0, 19.0, 13.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.7607421875, -4.595703125, -4.4306640625, -4.265625, -4.1005859375, -3.935546875, -3.7705078125, -3.60546875, -3.4404296875, -3.275390625, -3.1103515625, -2.9453125, -2.7802734375, -2.615234375, -2.4501953125, -2.28515625, -2.1201171875, -1.955078125, -1.7900390625, -1.625, -1.4599609375, -1.294921875, -1.1298828125, -0.96484375, -0.7998046875, -0.634765625, -0.4697265625, -0.3046875, -0.1396484375, 0.025390625, 0.1904296875, 0.35546875, 0.5205078125, 0.685546875, 0.8505859375, 1.015625, 1.1806640625, 1.345703125, 1.5107421875, 1.67578125, 1.8408203125, 2.005859375, 2.1708984375, 2.3359375, 2.5009765625, 2.666015625, 2.8310546875, 2.99609375, 3.1611328125, 3.326171875, 3.4912109375, 3.65625, 3.8212890625, 3.986328125, 4.1513671875, 4.31640625, 4.4814453125, 4.646484375, 4.8115234375, 4.9765625, 5.1416015625, 5.306640625, 5.4716796875, 5.63671875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 14.0, 19.0, 31.0, 64.0, 59.0, 100.0, 154.0, 215.0, 326.0, 573.0, 1010.0, 1970.0, 4168.0, 10138.0, 30960.0, 128332.0, 675938.0, 1841519.0, 1180792.0, 241944.0, 49560.0, 14997.0, 5709.0, 2466.0, 1262.0, 699.0, 384.0, 255.0, 172.0, 120.0, 82.0, 47.0, 33.0, 29.0, 29.0, 23.0, 19.0, 13.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.171875, -8.891357421875, -8.61083984375, -8.330322265625, -8.0498046875, -7.769287109375, -7.48876953125, -7.208251953125, -6.927734375, -6.647216796875, -6.36669921875, -6.086181640625, -5.8056640625, -5.525146484375, -5.24462890625, -4.964111328125, -4.68359375, -4.403076171875, -4.12255859375, -3.842041015625, -3.5615234375, -3.281005859375, -3.00048828125, -2.719970703125, -2.439453125, -2.158935546875, -1.87841796875, -1.597900390625, -1.3173828125, -1.036865234375, -0.75634765625, -0.475830078125, -0.1953125, 0.085205078125, 0.36572265625, 0.646240234375, 0.9267578125, 1.207275390625, 1.48779296875, 1.768310546875, 2.048828125, 2.329345703125, 2.60986328125, 2.890380859375, 3.1708984375, 3.451416015625, 3.73193359375, 4.012451171875, 4.29296875, 4.573486328125, 4.85400390625, 5.134521484375, 5.4150390625, 5.695556640625, 5.97607421875, 6.256591796875, 6.537109375, 6.817626953125, 7.09814453125, 7.378662109375, 7.6591796875, 7.939697265625, 8.22021484375, 8.500732421875, 8.78125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 10.0, 20.0, 16.0, 18.0, 23.0, 23.0, 54.0, 60.0, 78.0, 106.0, 144.0, 200.0, 216.0, 338.0, 386.0, 412.0, 431.0, 328.0, 311.0, 188.0, 176.0, 128.0, 103.0, 66.0, 59.0, 28.0, 43.0, 30.0, 19.0, 11.0, 11.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -9.979736328125, -9.60791015625, -9.236083984375, -8.8642578125, -8.492431640625, -8.12060546875, -7.748779296875, -7.376953125, -7.005126953125, -6.63330078125, -6.261474609375, -5.8896484375, -5.517822265625, -5.14599609375, -4.774169921875, -4.40234375, -4.030517578125, -3.65869140625, -3.286865234375, -2.9150390625, -2.543212890625, -2.17138671875, -1.799560546875, -1.427734375, -1.055908203125, -0.68408203125, -0.312255859375, 0.0595703125, 0.431396484375, 0.80322265625, 1.175048828125, 1.546875, 1.918701171875, 2.29052734375, 2.662353515625, 3.0341796875, 3.406005859375, 3.77783203125, 4.149658203125, 4.521484375, 4.893310546875, 5.26513671875, 5.636962890625, 6.0087890625, 6.380615234375, 6.75244140625, 7.124267578125, 7.49609375, 7.867919921875, 8.23974609375, 8.611572265625, 8.9833984375, 9.355224609375, 9.72705078125, 10.098876953125, 10.470703125, 10.842529296875, 11.21435546875, 11.586181640625, 11.9580078125, 12.329833984375, 12.70166015625, 13.073486328125, 13.4453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 12.0, 9.0, 6.0, 15.0, 18.0, 19.0, 23.0, 27.0, 47.0, 68.0, 71.0, 100.0, 146.0, 214.0, 393.0, 1128.0, 5364.0, 91694.0, 3452386.0, 621605.0, 17212.0, 2115.0, 573.0, 311.0, 182.0, 106.0, 102.0, 66.0, 69.0, 45.0, 34.0, 26.0, 18.0, 13.0, 10.0, 13.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-40.15625, -39.03271484375, -37.9091796875, -36.78564453125, -35.662109375, -34.53857421875, -33.4150390625, -32.29150390625, -31.16796875, -30.04443359375, -28.9208984375, -27.79736328125, -26.673828125, -25.55029296875, -24.4267578125, -23.30322265625, -22.1796875, -21.05615234375, -19.9326171875, -18.80908203125, -17.685546875, -16.56201171875, -15.4384765625, -14.31494140625, -13.19140625, -12.06787109375, -10.9443359375, -9.82080078125, -8.697265625, -7.57373046875, -6.4501953125, -5.32666015625, -4.203125, -3.07958984375, -1.9560546875, -0.83251953125, 0.291015625, 1.41455078125, 2.5380859375, 3.66162109375, 4.78515625, 5.90869140625, 7.0322265625, 8.15576171875, 9.279296875, 10.40283203125, 11.5263671875, 12.64990234375, 13.7734375, 14.89697265625, 16.0205078125, 17.14404296875, 18.267578125, 19.39111328125, 20.5146484375, 21.63818359375, 22.76171875, 23.88525390625, 25.0087890625, 26.13232421875, 27.255859375, 28.37939453125, 29.5029296875, 30.62646484375, 31.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 18.0, 25.0, 42.0, 107.0, 138.0, 162.0, 192.0, 132.0, 92.0, 50.0, 27.0, 15.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.44627380371094, -91.58157348632812, -88.71688079833984, -85.85218048095703, -82.98748779296875, -80.12278747558594, -77.25808715820312, -74.39339447021484, -71.52870178222656, -68.66400146484375, -65.79930877685547, -62.934608459472656, -60.069915771484375, -57.20521545410156, -54.340518951416016, -51.47582244873047, -48.611122131347656, -45.74642562866211, -42.88172912597656, -40.01702880859375, -37.15233612060547, -34.287635803222656, -31.42293930053711, -28.558242797851562, -25.693546295166016, -22.82884979248047, -19.964153289794922, -17.099454879760742, -14.234758377075195, -11.370061874389648, -8.505363464355469, -5.640666961669922, -2.7759628295898438, 0.08873414993286133, 2.9534311294555664, 5.81812858581543, 8.682825088500977, 11.547521591186523, 14.412220001220703, 17.27691650390625, 20.141613006591797, 23.006309509277344, 25.87100601196289, 28.73570442199707, 31.600400924682617, 34.46509552001953, 37.329795837402344, 40.19449234008789, 43.05918884277344, 45.923885345458984, 48.78858184814453, 51.653282165527344, 54.517974853515625, 57.38267517089844, 60.247371673583984, 63.11206817626953, 65.97676086425781, 68.84146118164062, 71.7061538696289, 74.57085418701172, 77.435546875, 80.30024719238281, 83.16494750976562, 86.0296401977539, 88.89434051513672]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 12.0, 7.0, 6.0, 13.0, 14.0, 17.0, 18.0, 22.0, 34.0, 31.0, 25.0, 37.0, 32.0, 38.0, 35.0, 54.0, 35.0, 50.0, 43.0, 32.0, 28.0, 33.0, 39.0, 38.0, 34.0, 31.0, 38.0, 22.0, 23.0, 27.0, 13.0, 17.0, 22.0, 13.0, 12.0, 15.0, 14.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-44.685394287109375, -43.43315124511719, -42.180912017822266, -40.92866897583008, -39.676429748535156, -38.42418670654297, -37.17194366455078, -35.91970443725586, -34.66746139526367, -33.415218353271484, -32.16297912597656, -30.910736083984375, -29.65849494934082, -28.406253814697266, -27.15401268005371, -25.901771545410156, -24.6495304107666, -23.397289276123047, -22.145048141479492, -20.892807006835938, -19.64056396484375, -18.388322830200195, -17.13608169555664, -15.88383960723877, -14.631598472595215, -13.37935733795166, -12.127115249633789, -10.874874114990234, -9.62263298034668, -8.370390892028809, -7.118149757385254, -5.865907669067383, -4.613666534423828, -3.3614249229431152, -2.1091835498809814, -0.8569421768188477, 0.39529943466186523, 1.6475410461425781, 2.899782180786133, 4.152024269104004, 5.404265403747559, 6.6565070152282715, 7.908748626708984, 9.160989761352539, 10.413230895996094, 11.665472984313965, 12.91771411895752, 14.16995620727539, 15.422197341918945, 16.6744384765625, 17.926679611206055, 19.17892074584961, 20.431163787841797, 21.68340492248535, 22.935646057128906, 24.187889099121094, 25.440128326416016, 26.69236946105957, 27.944610595703125, 29.196853637695312, 30.449094772338867, 31.701335906982422, 32.953575134277344, 34.20581817626953, 35.45806121826172]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 26.0, 48.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 9.0, 8.0, 28.0, 39.0, 65.0, 88.0, 137.0, 193.0, 336.0, 483.0, 722.0, 1060.0, 1651.0, 2494.0, 3855.0, 6064.0, 9302.0, 14522.0, 23202.0, 35901.0, 56899.0, 88645.0, 132188.0, 173355.0, 163855.0, 118451.0, 77679.0, 49606.0, 31397.0, 20249.0, 12904.0, 8124.0, 5314.0, 3309.0, 2267.0, 1438.0, 892.0, 593.0, 429.0, 259.0, 184.0, 115.0, 70.0, 52.0, 36.0, 35.0, 18.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5703125, -0.5524063110351562, -0.5345001220703125, -0.5165939331054688, -0.498687744140625, -0.48078155517578125, -0.4628753662109375, -0.44496917724609375, -0.42706298828125, -0.40915679931640625, -0.3912506103515625, -0.37334442138671875, -0.355438232421875, -0.33753204345703125, -0.3196258544921875, -0.30171966552734375, -0.2838134765625, -0.26590728759765625, -0.2480010986328125, -0.23009490966796875, -0.212188720703125, -0.19428253173828125, -0.1763763427734375, -0.15847015380859375, -0.14056396484375, -0.12265777587890625, -0.1047515869140625, -0.08684539794921875, -0.068939208984375, -0.05103302001953125, -0.0331268310546875, -0.01522064208984375, 0.002685546875, 0.02059173583984375, 0.0384979248046875, 0.05640411376953125, 0.074310302734375, 0.09221649169921875, 0.1101226806640625, 0.12802886962890625, 0.14593505859375, 0.16384124755859375, 0.1817474365234375, 0.19965362548828125, 0.217559814453125, 0.23546600341796875, 0.2533721923828125, 0.27127838134765625, 0.2891845703125, 0.30709075927734375, 0.3249969482421875, 0.34290313720703125, 0.360809326171875, 0.37871551513671875, 0.3966217041015625, 0.41452789306640625, 0.43243408203125, 0.45034027099609375, 0.4682464599609375, 0.48615264892578125, 0.504058837890625, 0.5219650268554688, 0.5398712158203125, 0.5577774047851562, 0.57568359375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 7.0, 13.0, 15.0, 11.0, 25.0, 27.0, 36.0, 37.0, 24.0, 48.0, 42.0, 48.0, 41.0, 35.0, 48.0, 1074.0, 44.0, 55.0, 45.0, 52.0, 35.0, 43.0, 31.0, 35.0, 23.0, 17.0, 17.0, 17.0, 18.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.7744140625, -3.638671875, -3.5029296875, -3.3671875, -3.2314453125, -3.095703125, -2.9599609375, -2.82421875, -2.6884765625, -2.552734375, -2.4169921875, -2.28125, -2.1455078125, -2.009765625, -1.8740234375, -1.73828125, -1.6025390625, -1.466796875, -1.3310546875, -1.1953125, -1.0595703125, -0.923828125, -0.7880859375, -0.65234375, -0.5166015625, -0.380859375, -0.2451171875, -0.109375, 0.0263671875, 0.162109375, 0.2978515625, 0.43359375, 0.5693359375, 0.705078125, 0.8408203125, 0.9765625, 1.1123046875, 1.248046875, 1.3837890625, 1.51953125, 1.6552734375, 1.791015625, 1.9267578125, 2.0625, 2.1982421875, 2.333984375, 2.4697265625, 2.60546875, 2.7412109375, 2.876953125, 3.0126953125, 3.1484375, 3.2841796875, 3.419921875, 3.5556640625, 3.69140625, 3.8271484375, 3.962890625, 4.0986328125, 4.234375, 4.3701171875, 4.505859375, 4.6416015625, 4.77734375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 14.0, 15.0, 23.0, 34.0, 49.0, 82.0, 162.0, 212.0, 396.0, 646.0, 1139.0, 1927.0, 3183.0, 5130.0, 8602.0, 14507.0, 24499.0, 40960.0, 67843.0, 108318.0, 156442.0, 1229716.0, 156428.0, 107360.0, 67558.0, 40941.0, 24308.0, 14851.0, 8730.0, 5288.0, 3131.0, 1861.0, 1128.0, 712.0, 358.0, 234.0, 162.0, 71.0, 37.0, 24.0, 12.0, 18.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.492919921875, -0.47820281982421875, -0.4634857177734375, -0.44876861572265625, -0.434051513671875, -0.41933441162109375, -0.4046173095703125, -0.38990020751953125, -0.37518310546875, -0.36046600341796875, -0.3457489013671875, -0.33103179931640625, -0.316314697265625, -0.30159759521484375, -0.2868804931640625, -0.27216339111328125, -0.2574462890625, -0.24272918701171875, -0.2280120849609375, -0.21329498291015625, -0.198577880859375, -0.18386077880859375, -0.1691436767578125, -0.15442657470703125, -0.13970947265625, -0.12499237060546875, -0.1102752685546875, -0.09555816650390625, -0.080841064453125, -0.06612396240234375, -0.0514068603515625, -0.03668975830078125, -0.02197265625, -0.00725555419921875, 0.0074615478515625, 0.02217864990234375, 0.036895751953125, 0.05161285400390625, 0.0663299560546875, 0.08104705810546875, 0.09576416015625, 0.11048126220703125, 0.1251983642578125, 0.13991546630859375, 0.154632568359375, 0.16934967041015625, 0.1840667724609375, 0.19878387451171875, 0.2135009765625, 0.22821807861328125, 0.2429351806640625, 0.25765228271484375, 0.272369384765625, 0.28708648681640625, 0.3018035888671875, 0.31652069091796875, 0.33123779296875, 0.34595489501953125, 0.3606719970703125, 0.37538909912109375, 0.390106201171875, 0.40482330322265625, 0.4195404052734375, 0.43425750732421875, 0.448974609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 13.0, 6.0, 11.0, 20.0, 25.0, 29.0, 39.0, 44.0, 64.0, 81.0, 89.0, 90.0, 98.0, 76.0, 75.0, 58.0, 37.0, 26.0, 27.0, 17.0, 15.0, 9.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.006439208984375, -0.0062631964683532715, -0.006087183952331543, -0.0059111714363098145, -0.005735158920288086, -0.005559146404266357, -0.005383133888244629, -0.0052071213722229, -0.005031108856201172, -0.004855096340179443, -0.004679083824157715, -0.004503071308135986, -0.004327058792114258, -0.004151046276092529, -0.003975033760070801, -0.0037990212440490723, -0.0036230087280273438, -0.0034469962120056152, -0.0032709836959838867, -0.003094971179962158, -0.0029189586639404297, -0.002742946147918701, -0.0025669336318969727, -0.002390921115875244, -0.0022149085998535156, -0.002038896083831787, -0.0018628835678100586, -0.00168687105178833, -0.0015108585357666016, -0.001334846019744873, -0.0011588335037231445, -0.000982820987701416, -0.0008068084716796875, -0.000630795955657959, -0.00045478343963623047, -0.00027877092361450195, -0.00010275840759277344, 7.325410842895508e-05, 0.0002492666244506836, 0.0004252791404724121, 0.0006012916564941406, 0.0007773041725158691, 0.0009533166885375977, 0.0011293292045593262, 0.0013053417205810547, 0.0014813542366027832, 0.0016573667526245117, 0.0018333792686462402, 0.0020093917846679688, 0.0021854043006896973, 0.0023614168167114258, 0.0025374293327331543, 0.002713441848754883, 0.0028894543647766113, 0.00306546688079834, 0.0032414793968200684, 0.003417491912841797, 0.0035935044288635254, 0.003769516944885254, 0.003945529460906982, 0.004121541976928711, 0.0042975544929504395, 0.004473567008972168, 0.0046495795249938965, 0.004825592041015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 11.0, 15.0, 16.0, 36.0, 53.0, 76.0, 133.0, 225.0, 501.0, 2850.0, 1018335.0, 24836.0, 750.0, 289.0, 144.0, 97.0, 50.0, 40.0, 18.0, 15.0, 9.0, 12.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.10495376586914062, -0.10102081298828125, -0.09708786010742188, -0.0931549072265625, -0.08922195434570312, -0.08528900146484375, -0.08135604858398438, -0.077423095703125, -0.07349014282226562, -0.06955718994140625, -0.06562423706054688, -0.0616912841796875, -0.057758331298828125, -0.05382537841796875, -0.049892425537109375, -0.04595947265625, -0.042026519775390625, -0.03809356689453125, -0.034160614013671875, -0.0302276611328125, -0.026294708251953125, -0.02236175537109375, -0.018428802490234375, -0.014495849609375, -0.010562896728515625, -0.00662994384765625, -0.002696990966796875, 0.0012359619140625, 0.005168914794921875, 0.00910186767578125, 0.013034820556640625, 0.0169677734375, 0.020900726318359375, 0.02483367919921875, 0.028766632080078125, 0.0326995849609375, 0.036632537841796875, 0.04056549072265625, 0.044498443603515625, 0.048431396484375, 0.052364349365234375, 0.05629730224609375, 0.060230255126953125, 0.0641632080078125, 0.06809616088867188, 0.07202911376953125, 0.07596206665039062, 0.07989501953125, 0.08382797241210938, 0.08776092529296875, 0.09169387817382812, 0.0956268310546875, 0.09955978393554688, 0.10349273681640625, 0.10742568969726562, 0.111358642578125, 0.11529159545898438, 0.11922454833984375, 0.12315750122070312, 0.1270904541015625, 0.13102340698242188, 0.13495635986328125, 0.13888931274414062, 0.142822265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 48.0, 807.0, 148.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026813577860593796, -0.0016594692133367062, -0.0006375806406140327, 0.00038430793210864067, 0.001406196504831314, 0.0024280850775539875, 0.003449973650276661, 0.004471862222999334, 0.005493750795722008, 0.006515639368444681, 0.007537527941167355, 0.008559416979551315, 0.009581305086612701, 0.010603193193674088, 0.011625082232058048, 0.012646971270442009, 0.013668859377503395, 0.014690747484564781, 0.015712637454271317, 0.016734525561332703, 0.01775641366839409, 0.018778301775455475, 0.01980018988251686, 0.020822079852223396, 0.021843967959284782, 0.02286585606634617, 0.023887746036052704, 0.02490963414311409, 0.025931522250175476, 0.026953410357236862, 0.02797529846429825, 0.028997188434004784, 0.03001907467842102, 0.031040962785482407, 0.03206285089254379, 0.03308473899960518, 0.034106627106666565, 0.03512851893901825, 0.036150407046079636, 0.03717229515314102, 0.03819418326020241, 0.039216071367263794, 0.04023795947432518, 0.041259847581386566, 0.04228173941373825, 0.04330362752079964, 0.04432551562786102, 0.04534740373492241, 0.046369291841983795, 0.04739117994904518, 0.04841306805610657, 0.049434956163167953, 0.05045684427022934, 0.051478736102581024, 0.05250062420964241, 0.053522512316703796, 0.05454440042376518, 0.05556628853082657, 0.056588176637887955, 0.05761006474494934, 0.058631956577301025, 0.05965384468436241, 0.0606757327914238, 0.061697620898485184, 0.06271950900554657]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 10.0, 15.0, 24.0, 26.0, 24.0, 30.0, 45.0, 42.0, 46.0, 74.0, 80.0, 68.0, 63.0, 69.0, 63.0, 50.0, 46.0, 51.0, 29.0, 28.0, 29.0, 23.0, 16.0, 10.0, 13.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00514751672744751, -0.005015549249947071, -0.004883581772446632, -0.004751614294946194, -0.004619646817445755, -0.004487679339945316, -0.004355711862444878, -0.004223744384944439, -0.004091776907444, -0.0039598094299435616, -0.003827841952443123, -0.003695874474942684, -0.0035639069974422455, -0.003431939519941807, -0.003299972042441368, -0.0031680045649409294, -0.0030360370874404907, -0.002904069609940052, -0.0027721021324396133, -0.0026401346549391747, -0.002508167177438736, -0.0023761996999382973, -0.0022442322224378586, -0.00211226474493742, -0.001980297267436981, -0.0018483297899365425, -0.0017163623124361038, -0.0015843948349356651, -0.0014524273574352264, -0.0013204598799347878, -0.001188492402434349, -0.0010565249249339104, -0.0009245574474334717, -0.000792589969933033, -0.0006606224924325943, -0.0005286550149321556, -0.0003966875374317169, -0.00026472005993127823, -0.00013275258243083954, -7.851049304008484e-07, 0.00013118237257003784, 0.00026314985007047653, 0.0003951173275709152, 0.0005270848050713539, 0.0006590522825717926, 0.0007910197600722313, 0.00092298723757267, 0.0010549547150731087, 0.0011869221925735474, 0.001318889670073986, 0.0014508571475744247, 0.0015828246250748634, 0.0017147921025753021, 0.0018467595800757408, 0.0019787270575761795, 0.002110694535076618, 0.002242662012577057, 0.0023746294900774956, 0.0025065969675779343, 0.002638564445078373, 0.0027705319225788116, 0.0029024994000792503, 0.003034466877579689, 0.0031664343550801277, 0.0032984018325805664]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 27.0, 47.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 15.0, 27.0, 34.0, 77.0, 117.0, 209.0, 289.0, 513.0, 922.0, 1688.0, 3437.0, 7373.0, 16888.0, 39932.0, 100964.0, 305161.0, 366589.0, 121406.0, 46459.0, 19404.0, 8679.0, 3902.0, 1952.0, 1035.0, 575.0, 327.0, 175.0, 123.0, 96.0, 63.0, 36.0, 24.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.72308349609375, -4.5711669921875, -4.41925048828125, -4.267333984375, -4.11541748046875, -3.9635009765625, -3.81158447265625, -3.65966796875, -3.50775146484375, -3.3558349609375, -3.20391845703125, -3.052001953125, -2.90008544921875, -2.7481689453125, -2.59625244140625, -2.4443359375, -2.29241943359375, -2.1405029296875, -1.98858642578125, -1.836669921875, -1.68475341796875, -1.5328369140625, -1.38092041015625, -1.22900390625, -1.07708740234375, -0.9251708984375, -0.77325439453125, -0.621337890625, -0.46942138671875, -0.3175048828125, -0.16558837890625, -0.013671875, 0.13824462890625, 0.2901611328125, 0.44207763671875, 0.593994140625, 0.74591064453125, 0.8978271484375, 1.04974365234375, 1.20166015625, 1.35357666015625, 1.5054931640625, 1.65740966796875, 1.809326171875, 1.96124267578125, 2.1131591796875, 2.26507568359375, 2.4169921875, 2.56890869140625, 2.7208251953125, 2.87274169921875, 3.024658203125, 3.17657470703125, 3.3284912109375, 3.48040771484375, 3.63232421875, 3.78424072265625, 3.9361572265625, 4.08807373046875, 4.239990234375, 4.39190673828125, 4.5438232421875, 4.69573974609375, 4.84765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 25.0, 27.0, 18.0, 33.0, 27.0, 36.0, 30.0, 64.0, 58.0, 94.0, 168.0, 1645.0, 269.0, 90.0, 60.0, 47.0, 49.0, 40.0, 29.0, 32.0, 31.0, 17.0, 25.0, 12.0, 14.0, 6.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.34375, -25.584228515625, -24.82470703125, -24.065185546875, -23.3056640625, -22.546142578125, -21.78662109375, -21.027099609375, -20.267578125, -19.508056640625, -18.74853515625, -17.989013671875, -17.2294921875, -16.469970703125, -15.71044921875, -14.950927734375, -14.19140625, -13.431884765625, -12.67236328125, -11.912841796875, -11.1533203125, -10.393798828125, -9.63427734375, -8.874755859375, -8.115234375, -7.355712890625, -6.59619140625, -5.836669921875, -5.0771484375, -4.317626953125, -3.55810546875, -2.798583984375, -2.0390625, -1.279541015625, -0.52001953125, 0.239501953125, 0.9990234375, 1.758544921875, 2.51806640625, 3.277587890625, 4.037109375, 4.796630859375, 5.55615234375, 6.315673828125, 7.0751953125, 7.834716796875, 8.59423828125, 9.353759765625, 10.11328125, 10.872802734375, 11.63232421875, 12.391845703125, 13.1513671875, 13.910888671875, 14.67041015625, 15.429931640625, 16.189453125, 16.948974609375, 17.70849609375, 18.468017578125, 19.2275390625, 19.987060546875, 20.74658203125, 21.506103515625, 22.265625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 8.0, 14.0, 19.0, 13.0, 15.0, 15.0, 45.0, 38.0, 65.0, 67.0, 109.0, 128.0, 209.0, 261.0, 480.0, 2146.0, 231901.0, 2903542.0, 4781.0, 721.0, 331.0, 213.0, 165.0, 88.0, 67.0, 63.0, 32.0, 41.0, 33.0, 20.0, 22.0, 10.0, 8.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -48.0732421875, -46.365234375, -44.6572265625, -42.94921875, -41.2412109375, -39.533203125, -37.8251953125, -36.1171875, -34.4091796875, -32.701171875, -30.9931640625, -29.28515625, -27.5771484375, -25.869140625, -24.1611328125, -22.453125, -20.7451171875, -19.037109375, -17.3291015625, -15.62109375, -13.9130859375, -12.205078125, -10.4970703125, -8.7890625, -7.0810546875, -5.373046875, -3.6650390625, -1.95703125, -0.2490234375, 1.458984375, 3.1669921875, 4.875, 6.5830078125, 8.291015625, 9.9990234375, 11.70703125, 13.4150390625, 15.123046875, 16.8310546875, 18.5390625, 20.2470703125, 21.955078125, 23.6630859375, 25.37109375, 27.0791015625, 28.787109375, 30.4951171875, 32.203125, 33.9111328125, 35.619140625, 37.3271484375, 39.03515625, 40.7431640625, 42.451171875, 44.1591796875, 45.8671875, 47.5751953125, 49.283203125, 50.9912109375, 52.69921875, 54.4072265625, 56.115234375, 57.8232421875, 59.53125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 156.0, 584.0, 250.0, 13.0, 6.0], "bins": [-253.69003295898438, -249.50735473632812, -245.32469177246094, -241.1420135498047, -236.9593505859375, -232.77667236328125, -228.59400939941406, -224.4113311767578, -220.22866821289062, -216.04598999023438, -211.8633270263672, -207.68064880371094, -203.49798583984375, -199.3153076171875, -195.1326446533203, -190.94996643066406, -186.76730346679688, -182.58462524414062, -178.40196228027344, -174.2192840576172, -170.03662109375, -165.85394287109375, -161.67127990722656, -157.4886016845703, -153.30592346191406, -149.1232452392578, -144.94058227539062, -140.75790405273438, -136.5752410888672, -132.39256286621094, -128.20989990234375, -124.0272216796875, -119.84456634521484, -115.66189575195312, -111.4792251586914, -107.29655456542969, -103.11388397216797, -98.93121337890625, -94.74853515625, -90.56587219238281, -86.38319396972656, -82.20052337646484, -78.01785278320312, -73.8351821899414, -69.65251159667969, -65.46984100341797, -61.287166595458984, -57.104496002197266, -52.92182922363281, -48.739158630371094, -44.556488037109375, -40.373817443847656, -36.19114685058594, -32.00847625732422, -27.825801849365234, -23.643131256103516, -19.460460662841797, -15.277790069580078, -11.095118522644043, -6.912446975708008, -2.729776382446289, 1.4528942108154297, 5.635566711425781, 9.8182373046875, 14.000907897949219]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 11.0, 1.0, 5.0, 5.0, 7.0, 12.0, 11.0, 7.0, 12.0, 11.0, 17.0, 18.0, 22.0, 20.0, 27.0, 28.0, 27.0, 44.0, 33.0, 46.0, 44.0, 48.0, 48.0, 40.0, 47.0, 44.0, 47.0, 42.0, 40.0, 23.0, 25.0, 33.0, 21.0, 24.0, 17.0, 16.0, 15.0, 15.0, 12.0, 11.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.866756439208984, -47.237186431884766, -45.60762023925781, -43.978050231933594, -42.34848403930664, -40.71891403198242, -39.08934783935547, -37.45977783203125, -35.83020782470703, -34.20063781738281, -32.57107162475586, -30.94150161743164, -29.311935424804688, -27.68236541748047, -26.052797317504883, -24.423229217529297, -22.793663024902344, -21.164094924926758, -19.534526824951172, -17.904956817626953, -16.275390625, -14.645821571350098, -13.016252517700195, -11.38668441772461, -9.757116317749023, -8.127548217773438, -6.497979640960693, -4.868411064147949, -3.2388429641723633, -1.6092748641967773, 0.020294189453125, 1.649862289428711, 3.2794342041015625, 4.909002304077148, 6.538570880889893, 8.168139457702637, 9.797707557678223, 11.427275657653809, 13.056844711303711, 14.686412811279297, 16.315980911254883, 17.94554901123047, 19.575117111206055, 21.20468521118164, 22.83425521850586, 24.463821411132812, 26.09339141845703, 27.722959518432617, 29.352527618408203, 30.98209571838379, 32.611663818359375, 34.241233825683594, 35.87080001831055, 37.500370025634766, 39.12993621826172, 40.75950622558594, 42.389076232910156, 44.018646240234375, 45.64821243286133, 47.27778244018555, 48.9073486328125, 50.53691864013672, 52.16648864746094, 53.79605484008789, 55.425621032714844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 10.0, 9.0, 16.0, 12.0, 11.0, 22.0, 24.0, 31.0, 23.0, 29.0, 22.0, 34.0, 30.0, 39.0, 43.0, 58.0, 42.0, 42.0, 34.0, 43.0, 38.0, 37.0, 37.0, 39.0, 32.0, 46.0, 31.0, 22.0, 21.0, 19.0, 15.0, 14.0, 13.0, 11.0, 13.0, 6.0, 4.0, 9.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.4361572265625, -5.243408203125, -5.0506591796875, -4.85791015625, -4.6651611328125, -4.472412109375, -4.2796630859375, -4.0869140625, -3.8941650390625, -3.701416015625, -3.5086669921875, -3.31591796875, -3.1231689453125, -2.930419921875, -2.7376708984375, -2.544921875, -2.3521728515625, -2.159423828125, -1.9666748046875, -1.77392578125, -1.5811767578125, -1.388427734375, -1.1956787109375, -1.0029296875, -0.8101806640625, -0.617431640625, -0.4246826171875, -0.23193359375, -0.0391845703125, 0.153564453125, 0.3463134765625, 0.5390625, 0.7318115234375, 0.924560546875, 1.1173095703125, 1.31005859375, 1.5028076171875, 1.695556640625, 1.8883056640625, 2.0810546875, 2.2738037109375, 2.466552734375, 2.6593017578125, 2.85205078125, 3.0447998046875, 3.237548828125, 3.4302978515625, 3.623046875, 3.8157958984375, 4.008544921875, 4.2012939453125, 4.39404296875, 4.5867919921875, 4.779541015625, 4.9722900390625, 5.1650390625, 5.3577880859375, 5.550537109375, 5.7432861328125, 5.93603515625, 6.1287841796875, 6.321533203125, 6.5142822265625, 6.70703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 9.0, 8.0, 10.0, 17.0, 21.0, 23.0, 26.0, 20.0, 23.0, 27.0, 19.0, 52.0, 84.0, 229.0, 941.0, 5483.0, 97002.0, 3231045.0, 838919.0, 17329.0, 2066.0, 426.0, 147.0, 69.0, 43.0, 41.0, 28.0, 28.0, 17.0, 19.0, 16.0, 19.0, 15.0, 7.0, 8.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.177001953125, -20.38525390625, -19.593505859375, -18.8017578125, -18.010009765625, -17.21826171875, -16.426513671875, -15.634765625, -14.843017578125, -14.05126953125, -13.259521484375, -12.4677734375, -11.676025390625, -10.88427734375, -10.092529296875, -9.30078125, -8.509033203125, -7.71728515625, -6.925537109375, -6.1337890625, -5.342041015625, -4.55029296875, -3.758544921875, -2.966796875, -2.175048828125, -1.38330078125, -0.591552734375, 0.2001953125, 0.991943359375, 1.78369140625, 2.575439453125, 3.3671875, 4.158935546875, 4.95068359375, 5.742431640625, 6.5341796875, 7.325927734375, 8.11767578125, 8.909423828125, 9.701171875, 10.492919921875, 11.28466796875, 12.076416015625, 12.8681640625, 13.659912109375, 14.45166015625, 15.243408203125, 16.03515625, 16.826904296875, 17.61865234375, 18.410400390625, 19.2021484375, 19.993896484375, 20.78564453125, 21.577392578125, 22.369140625, 23.160888671875, 23.95263671875, 24.744384765625, 25.5361328125, 26.327880859375, 27.11962890625, 27.911376953125, 28.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 2.0, 8.0, 15.0, 12.0, 12.0, 17.0, 24.0, 30.0, 24.0, 50.0, 55.0, 67.0, 95.0, 97.0, 117.0, 164.0, 217.0, 255.0, 319.0, 358.0, 352.0, 345.0, 298.0, 235.0, 203.0, 152.0, 114.0, 102.0, 71.0, 68.0, 46.0, 31.0, 33.0, 19.0, 17.0, 14.0, 5.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.625, -10.3140869140625, -10.003173828125, -9.6922607421875, -9.38134765625, -9.0704345703125, -8.759521484375, -8.4486083984375, -8.1376953125, -7.8267822265625, -7.515869140625, -7.2049560546875, -6.89404296875, -6.5831298828125, -6.272216796875, -5.9613037109375, -5.650390625, -5.3394775390625, -5.028564453125, -4.7176513671875, -4.40673828125, -4.0958251953125, -3.784912109375, -3.4739990234375, -3.1630859375, -2.8521728515625, -2.541259765625, -2.2303466796875, -1.91943359375, -1.6085205078125, -1.297607421875, -0.9866943359375, -0.67578125, -0.3648681640625, -0.053955078125, 0.2569580078125, 0.56787109375, 0.8787841796875, 1.189697265625, 1.5006103515625, 1.8115234375, 2.1224365234375, 2.433349609375, 2.7442626953125, 3.05517578125, 3.3660888671875, 3.677001953125, 3.9879150390625, 4.298828125, 4.6097412109375, 4.920654296875, 5.2315673828125, 5.54248046875, 5.8533935546875, 6.164306640625, 6.4752197265625, 6.7861328125, 7.0970458984375, 7.407958984375, 7.7188720703125, 8.02978515625, 8.3406982421875, 8.651611328125, 8.9625244140625, 9.2734375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 11.0, 26.0, 28.0, 26.0, 46.0, 63.0, 101.0, 149.0, 218.0, 312.0, 807.0, 6086.0, 371188.0, 3763225.0, 48539.0, 2017.0, 543.0, 266.0, 156.0, 118.0, 76.0, 67.0, 44.0, 41.0, 27.0, 25.0, 10.0, 9.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.3837890625, -36.923828125, -35.4638671875, -34.00390625, -32.5439453125, -31.083984375, -29.6240234375, -28.1640625, -26.7041015625, -25.244140625, -23.7841796875, -22.32421875, -20.8642578125, -19.404296875, -17.9443359375, -16.484375, -15.0244140625, -13.564453125, -12.1044921875, -10.64453125, -9.1845703125, -7.724609375, -6.2646484375, -4.8046875, -3.3447265625, -1.884765625, -0.4248046875, 1.03515625, 2.4951171875, 3.955078125, 5.4150390625, 6.875, 8.3349609375, 9.794921875, 11.2548828125, 12.71484375, 14.1748046875, 15.634765625, 17.0947265625, 18.5546875, 20.0146484375, 21.474609375, 22.9345703125, 24.39453125, 25.8544921875, 27.314453125, 28.7744140625, 30.234375, 31.6943359375, 33.154296875, 34.6142578125, 36.07421875, 37.5341796875, 38.994140625, 40.4541015625, 41.9140625, 43.3740234375, 44.833984375, 46.2939453125, 47.75390625, 49.2138671875, 50.673828125, 52.1337890625, 53.59375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 59.0, 173.0, 295.0, 310.0, 127.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.20521545410156, -181.99156188964844, -176.77792358398438, -171.56427001953125, -166.35061645507812, -161.136962890625, -155.92330932617188, -150.7096710205078, -145.4960174560547, -140.28236389160156, -135.0687255859375, -129.85507202148438, -124.64141845703125, -119.42776489257812, -114.21411895751953, -109.00047302246094, -103.78681945800781, -98.57316589355469, -93.3595199584961, -88.1458740234375, -82.93222045898438, -77.71856689453125, -72.50492095947266, -67.29127502441406, -62.07762145996094, -56.86397171020508, -51.65032196044922, -46.43667221069336, -41.2230224609375, -36.00937271118164, -30.79572296142578, -25.582073211669922, -20.368423461914062, -15.154773712158203, -9.941123962402344, -4.727474212646484, 0.486175537109375, 5.699825286865234, 10.913475036621094, 16.127124786376953, 21.340774536132812, 26.554424285888672, 31.76807403564453, 36.98172378540039, 42.19537353515625, 47.40902328491211, 52.62267303466797, 57.83632278442383, 63.04997253417969, 68.26362609863281, 73.4772720336914, 78.69091796875, 83.90457153320312, 89.11822509765625, 94.33187103271484, 99.54551696777344, 104.75917053222656, 109.97282409667969, 115.18647003173828, 120.40011596679688, 125.61376953125, 130.82742309570312, 136.04107666015625, 141.2547149658203, 146.46836853027344]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 9.0, 2.0, 6.0, 5.0, 8.0, 9.0, 17.0, 14.0, 15.0, 27.0, 21.0, 26.0, 46.0, 29.0, 35.0, 39.0, 39.0, 38.0, 43.0, 38.0, 38.0, 40.0, 31.0, 41.0, 35.0, 40.0, 33.0, 25.0, 43.0, 36.0, 25.0, 30.0, 22.0, 15.0, 24.0, 17.0, 5.0, 11.0, 7.0, 1.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.928253173828125, -39.651458740234375, -38.374664306640625, -37.09787368774414, -35.82107925415039, -34.54428482055664, -33.26749038696289, -31.99069595336914, -30.713903427124023, -29.437108993530273, -28.160316467285156, -26.883522033691406, -25.606727600097656, -24.32993507385254, -23.05314064025879, -21.776348114013672, -20.499553680419922, -19.222759246826172, -17.945966720581055, -16.669172286987305, -15.392378807067871, -14.115585327148438, -12.838790893554688, -11.561997413635254, -10.28520393371582, -9.008410453796387, -7.731616497039795, -6.454822540283203, -5.1780290603637695, -3.901235580444336, -2.624441623687744, -1.3476476669311523, -0.07085800170898438, 1.2059357166290283, 2.482729434967041, 3.7595231533050537, 5.036316871643066, 6.3131103515625, 7.589904308319092, 8.866698265075684, 10.143491744995117, 11.42028522491455, 12.697078704833984, 13.973873138427734, 15.250666618347168, 16.5274600982666, 17.80425453186035, 19.08104705810547, 20.35784149169922, 21.63463592529297, 22.911428451538086, 24.188222885131836, 25.465015411376953, 26.741809844970703, 28.018604278564453, 29.295398712158203, 30.57219123840332, 31.84898567199707, 33.12577819824219, 34.40257263183594, 35.67936706542969, 36.95616149902344, 38.23295211791992, 39.50974655151367, 40.78654098510742]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 45.0, 20.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 8.0, 23.0, 44.0, 58.0, 93.0, 140.0, 249.0, 402.0, 639.0, 1037.0, 1647.0, 2623.0, 4221.0, 6869.0, 11272.0, 19178.0, 32383.0, 56394.0, 97039.0, 159933.0, 213022.0, 175589.0, 109701.0, 64459.0, 36964.0, 21565.0, 12881.0, 7626.0, 4764.0, 2869.0, 1835.0, 1111.0, 689.0, 447.0, 285.0, 168.0, 121.0, 59.0, 40.0, 38.0, 15.0, 15.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.7861328125, -0.7640609741210938, -0.7419891357421875, -0.7199172973632812, -0.697845458984375, -0.6757736206054688, -0.6537017822265625, -0.6316299438476562, -0.60955810546875, -0.5874862670898438, -0.5654144287109375, -0.5433425903320312, -0.521270751953125, -0.49919891357421875, -0.4771270751953125, -0.45505523681640625, -0.4329833984375, -0.41091156005859375, -0.3888397216796875, -0.36676788330078125, -0.344696044921875, -0.32262420654296875, -0.3005523681640625, -0.27848052978515625, -0.25640869140625, -0.23433685302734375, -0.2122650146484375, -0.19019317626953125, -0.168121337890625, -0.14604949951171875, -0.1239776611328125, -0.10190582275390625, -0.079833984375, -0.05776214599609375, -0.0356903076171875, -0.01361846923828125, 0.008453369140625, 0.03052520751953125, 0.0525970458984375, 0.07466888427734375, 0.09674072265625, 0.11881256103515625, 0.1408843994140625, 0.16295623779296875, 0.185028076171875, 0.20709991455078125, 0.2291717529296875, 0.25124359130859375, 0.2733154296875, 0.29538726806640625, 0.3174591064453125, 0.33953094482421875, 0.361602783203125, 0.38367462158203125, 0.4057464599609375, 0.42781829833984375, 0.44989013671875, 0.47196197509765625, 0.4940338134765625, 0.5161056518554688, 0.538177490234375, 0.5602493286132812, 0.5823211669921875, 0.6043930053710938, 0.62646484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 12.0, 10.0, 11.0, 10.0, 19.0, 21.0, 20.0, 28.0, 28.0, 20.0, 31.0, 39.0, 33.0, 58.0, 44.0, 38.0, 1080.0, 51.0, 35.0, 42.0, 44.0, 31.0, 53.0, 35.0, 37.0, 38.0, 27.0, 26.0, 13.0, 15.0, 8.0, 13.0, 9.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.40118408203125, -4.2633056640625, -4.12542724609375, -3.987548828125, -3.84967041015625, -3.7117919921875, -3.57391357421875, -3.43603515625, -3.29815673828125, -3.1602783203125, -3.02239990234375, -2.884521484375, -2.74664306640625, -2.6087646484375, -2.47088623046875, -2.3330078125, -2.19512939453125, -2.0572509765625, -1.91937255859375, -1.781494140625, -1.64361572265625, -1.5057373046875, -1.36785888671875, -1.22998046875, -1.09210205078125, -0.9542236328125, -0.81634521484375, -0.678466796875, -0.54058837890625, -0.4027099609375, -0.26483154296875, -0.126953125, 0.01092529296875, 0.1488037109375, 0.28668212890625, 0.424560546875, 0.56243896484375, 0.7003173828125, 0.83819580078125, 0.97607421875, 1.11395263671875, 1.2518310546875, 1.38970947265625, 1.527587890625, 1.66546630859375, 1.8033447265625, 1.94122314453125, 2.0791015625, 2.21697998046875, 2.3548583984375, 2.49273681640625, 2.630615234375, 2.76849365234375, 2.9063720703125, 3.04425048828125, 3.18212890625, 3.32000732421875, 3.4578857421875, 3.59576416015625, 3.733642578125, 3.87152099609375, 4.0093994140625, 4.14727783203125, 4.28515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 17.0, 25.0, 32.0, 55.0, 69.0, 86.0, 172.0, 274.0, 424.0, 635.0, 1094.0, 1689.0, 2528.0, 3986.0, 6246.0, 9811.0, 15546.0, 24074.0, 37630.0, 58271.0, 87229.0, 121375.0, 506172.0, 843562.0, 122644.0, 87970.0, 58836.0, 38234.0, 24604.0, 15843.0, 10051.0, 6532.0, 4094.0, 2677.0, 1686.0, 1028.0, 650.0, 444.0, 297.0, 207.0, 115.0, 81.0, 49.0, 30.0, 15.0, 12.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.409423828125, -0.395782470703125, -0.38214111328125, -0.368499755859375, -0.3548583984375, -0.341217041015625, -0.32757568359375, -0.313934326171875, -0.30029296875, -0.286651611328125, -0.27301025390625, -0.259368896484375, -0.2457275390625, -0.232086181640625, -0.21844482421875, -0.204803466796875, -0.191162109375, -0.177520751953125, -0.16387939453125, -0.150238037109375, -0.1365966796875, -0.122955322265625, -0.10931396484375, -0.095672607421875, -0.08203125, -0.068389892578125, -0.05474853515625, -0.041107177734375, -0.0274658203125, -0.013824462890625, -0.00018310546875, 0.013458251953125, 0.027099609375, 0.040740966796875, 0.05438232421875, 0.068023681640625, 0.0816650390625, 0.095306396484375, 0.10894775390625, 0.122589111328125, 0.13623046875, 0.149871826171875, 0.16351318359375, 0.177154541015625, 0.1907958984375, 0.204437255859375, 0.21807861328125, 0.231719970703125, 0.245361328125, 0.259002685546875, 0.27264404296875, 0.286285400390625, 0.2999267578125, 0.313568115234375, 0.32720947265625, 0.340850830078125, 0.3544921875, 0.368133544921875, 0.38177490234375, 0.395416259765625, 0.4090576171875, 0.422698974609375, 0.43634033203125, 0.449981689453125, 0.463623046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 6.0, 3.0, 7.0, 6.0, 8.0, 13.0, 12.0, 21.0, 26.0, 17.0, 32.0, 35.0, 46.0, 41.0, 58.0, 79.0, 74.0, 64.0, 65.0, 52.0, 61.0, 49.0, 36.0, 29.0, 27.0, 19.0, 19.0, 18.0, 8.0, 11.0, 11.0, 7.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004188179969787598, -0.004065752029418945, -0.003943324089050293, -0.0038208961486816406, -0.0036984682083129883, -0.003576040267944336, -0.0034536123275756836, -0.0033311843872070312, -0.003208756446838379, -0.0030863285064697266, -0.0029639005661010742, -0.002841472625732422, -0.0027190446853637695, -0.002596616744995117, -0.002474188804626465, -0.0023517608642578125, -0.00222933292388916, -0.002106904983520508, -0.0019844770431518555, -0.0018620491027832031, -0.0017396211624145508, -0.0016171932220458984, -0.001494765281677246, -0.0013723373413085938, -0.0012499094009399414, -0.001127481460571289, -0.0010050535202026367, -0.0008826255798339844, -0.000760197639465332, -0.0006377696990966797, -0.0005153417587280273, -0.000392913818359375, -0.00027048587799072266, -0.0001480579376220703, -2.562999725341797e-05, 9.679794311523438e-05, 0.00021922588348388672, 0.00034165382385253906, 0.0004640817642211914, 0.0005865097045898438, 0.0007089376449584961, 0.0008313655853271484, 0.0009537935256958008, 0.0010762214660644531, 0.0011986494064331055, 0.0013210773468017578, 0.0014435052871704102, 0.0015659332275390625, 0.0016883611679077148, 0.0018107891082763672, 0.0019332170486450195, 0.002055644989013672, 0.0021780729293823242, 0.0023005008697509766, 0.002422928810119629, 0.0025453567504882812, 0.0026677846908569336, 0.002790212631225586, 0.0029126405715942383, 0.0030350685119628906, 0.003157496452331543, 0.0032799243927001953, 0.0034023523330688477, 0.0035247802734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 7.0, 11.0, 6.0, 12.0, 18.0, 17.0, 23.0, 22.0, 35.0, 57.0, 63.0, 126.0, 183.0, 316.0, 885.0, 34974.0, 1003709.0, 6674.0, 590.0, 279.0, 171.0, 107.0, 69.0, 28.0, 38.0, 29.0, 19.0, 14.0, 15.0, 18.0, 8.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08575439453125, -0.08301925659179688, -0.08028411865234375, -0.07754898071289062, -0.0748138427734375, -0.07207870483398438, -0.06934356689453125, -0.06660842895507812, -0.063873291015625, -0.061138153076171875, -0.05840301513671875, -0.055667877197265625, -0.0529327392578125, -0.050197601318359375, -0.04746246337890625, -0.044727325439453125, -0.0419921875, -0.039257049560546875, -0.03652191162109375, -0.033786773681640625, -0.0310516357421875, -0.028316497802734375, -0.02558135986328125, -0.022846221923828125, -0.020111083984375, -0.017375946044921875, -0.01464080810546875, -0.011905670166015625, -0.0091705322265625, -0.006435394287109375, -0.00370025634765625, -0.000965118408203125, 0.00177001953125, 0.004505157470703125, 0.00724029541015625, 0.009975433349609375, 0.0127105712890625, 0.015445709228515625, 0.01818084716796875, 0.020915985107421875, 0.023651123046875, 0.026386260986328125, 0.02912139892578125, 0.031856536865234375, 0.0345916748046875, 0.037326812744140625, 0.04006195068359375, 0.042797088623046875, 0.0455322265625, 0.048267364501953125, 0.05100250244140625, 0.053737640380859375, 0.0564727783203125, 0.059207916259765625, 0.06194305419921875, 0.06467819213867188, 0.067413330078125, 0.07014846801757812, 0.07288360595703125, 0.07561874389648438, 0.0783538818359375, 0.08108901977539062, 0.08382415771484375, 0.08655929565429688, 0.08929443359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 10.0, 174.0, 731.0, 93.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030269038397818804, -0.002339038299396634, -0.001651172642596066, -0.0009633069857954979, -0.0002754414454102516, 0.00041242409497499466, 0.0011002898681908846, 0.0017881554085761309, 0.002476020948961377, 0.0031638864893466234, 0.0038517522625625134, 0.00453961780294776, 0.005227483343333006, 0.005915348883718252, 0.006603214889764786, 0.007291080430150032, 0.007978945970535278, 0.008666811510920525, 0.009354677051305771, 0.010042542591691017, 0.010730408132076263, 0.01141827367246151, 0.012106139212846756, 0.012794004753232002, 0.013481870293617249, 0.014169735834002495, 0.014857601374387741, 0.015545466914772987, 0.016233332455158234, 0.01692119799554348, 0.017609063535928726, 0.018296929076313972, 0.018984796479344368, 0.019672662019729614, 0.02036052756011486, 0.021048393100500107, 0.021736258640885353, 0.0224241241812706, 0.023111989721655846, 0.023799855262041092, 0.024487720802426338, 0.025175586342811584, 0.02586345188319683, 0.026551317423582077, 0.027239182963967323, 0.02792704850435257, 0.028614914044737816, 0.029302779585123062, 0.029990646988153458, 0.030678512528538704, 0.03136637806892395, 0.032054245471954346, 0.03274210914969444, 0.03342997655272484, 0.034117840230464935, 0.03480570763349533, 0.03549357131123543, 0.03618143871426582, 0.03686930239200592, 0.037557169795036316, 0.03824503347277641, 0.03893290087580681, 0.039620764553546906, 0.0403086319565773, 0.0409964956343174]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 8.0, 12.0, 15.0, 17.0, 25.0, 28.0, 30.0, 35.0, 35.0, 50.0, 35.0, 38.0, 53.0, 41.0, 39.0, 39.0, 47.0, 51.0, 53.0, 45.0, 52.0, 37.0, 30.0, 26.0, 29.0, 21.0, 21.0, 14.0, 11.0, 16.0, 12.0, 14.0, 7.0, 1.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028460025787353516, -0.002757125534117222, -0.002668248489499092, -0.0025793714448809624, -0.0024904944002628326, -0.002401617355644703, -0.002312740311026573, -0.0022238632664084435, -0.0021349862217903137, -0.002046109177172184, -0.0019572321325540543, -0.0018683550879359245, -0.0017794780433177948, -0.001690600998699665, -0.0016017239540815353, -0.0015128469094634056, -0.0014239698648452759, -0.0013350928202271461, -0.0012462157756090164, -0.0011573387309908867, -0.001068461686372757, -0.0009795846417546272, -0.0008907075971364975, -0.0008018305525183678, -0.000712953507900238, -0.0006240764632821083, -0.0005351994186639786, -0.00044632237404584885, -0.0003574453294277191, -0.0002685682848095894, -0.00017969124019145966, -9.081419557332993e-05, -1.9371509552001953e-06, 8.693989366292953e-05, 0.00017581693828105927, 0.000264693982899189, 0.0003535710275173187, 0.00044244807213544846, 0.0005313251167535782, 0.0006202021613717079, 0.0007090792059898376, 0.0007979562506079674, 0.0008868332952260971, 0.0009757103398442268, 0.0010645873844623566, 0.0011534644290804863, 0.001242341473698616, 0.0013312185183167458, 0.0014200955629348755, 0.0015089726075530052, 0.001597849652171135, 0.0016867266967892647, 0.0017756037414073944, 0.0018644807860255241, 0.001953357830643654, 0.0020422348752617836, 0.0021311119198799133, 0.002219988964498043, 0.002308866009116173, 0.0023977430537343025, 0.0024866200983524323, 0.002575497142970562, 0.0026643741875886917, 0.0027532512322068214, 0.002842128276824951]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 46.0, 19.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 10.0, 16.0, 14.0, 20.0, 31.0, 59.0, 79.0, 115.0, 183.0, 341.0, 550.0, 965.0, 1789.0, 3440.0, 6680.0, 14493.0, 39002.0, 123582.0, 447300.0, 279982.0, 80562.0, 27073.0, 10958.0, 5087.0, 2693.0, 1473.0, 821.0, 484.0, 276.0, 153.0, 98.0, 61.0, 42.0, 26.0, 27.0, 19.0, 7.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.438720703125, -5.25634765625, -5.073974609375, -4.8916015625, -4.709228515625, -4.52685546875, -4.344482421875, -4.162109375, -3.979736328125, -3.79736328125, -3.614990234375, -3.4326171875, -3.250244140625, -3.06787109375, -2.885498046875, -2.703125, -2.520751953125, -2.33837890625, -2.156005859375, -1.9736328125, -1.791259765625, -1.60888671875, -1.426513671875, -1.244140625, -1.061767578125, -0.87939453125, -0.697021484375, -0.5146484375, -0.332275390625, -0.14990234375, 0.032470703125, 0.21484375, 0.397216796875, 0.57958984375, 0.761962890625, 0.9443359375, 1.126708984375, 1.30908203125, 1.491455078125, 1.673828125, 1.856201171875, 2.03857421875, 2.220947265625, 2.4033203125, 2.585693359375, 2.76806640625, 2.950439453125, 3.1328125, 3.315185546875, 3.49755859375, 3.679931640625, 3.8623046875, 4.044677734375, 4.22705078125, 4.409423828125, 4.591796875, 4.774169921875, 4.95654296875, 5.138916015625, 5.3212890625, 5.503662109375, 5.68603515625, 5.868408203125, 6.05078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 7.0, 15.0, 13.0, 13.0, 10.0, 24.0, 18.0, 27.0, 30.0, 35.0, 36.0, 32.0, 41.0, 61.0, 51.0, 69.0, 140.0, 1481.0, 322.0, 125.0, 80.0, 46.0, 38.0, 43.0, 32.0, 31.0, 31.0, 23.0, 28.0, 23.0, 16.0, 16.0, 15.0, 11.0, 9.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.09375, -18.49560546875, -17.8974609375, -17.29931640625, -16.701171875, -16.10302734375, -15.5048828125, -14.90673828125, -14.30859375, -13.71044921875, -13.1123046875, -12.51416015625, -11.916015625, -11.31787109375, -10.7197265625, -10.12158203125, -9.5234375, -8.92529296875, -8.3271484375, -7.72900390625, -7.130859375, -6.53271484375, -5.9345703125, -5.33642578125, -4.73828125, -4.14013671875, -3.5419921875, -2.94384765625, -2.345703125, -1.74755859375, -1.1494140625, -0.55126953125, 0.046875, 0.64501953125, 1.2431640625, 1.84130859375, 2.439453125, 3.03759765625, 3.6357421875, 4.23388671875, 4.83203125, 5.43017578125, 6.0283203125, 6.62646484375, 7.224609375, 7.82275390625, 8.4208984375, 9.01904296875, 9.6171875, 10.21533203125, 10.8134765625, 11.41162109375, 12.009765625, 12.60791015625, 13.2060546875, 13.80419921875, 14.40234375, 15.00048828125, 15.5986328125, 16.19677734375, 16.794921875, 17.39306640625, 17.9912109375, 18.58935546875, 19.1875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 21.0, 22.0, 48.0, 50.0, 94.0, 138.0, 198.0, 355.0, 845.0, 17680.0, 3120232.0, 4380.0, 695.0, 342.0, 194.0, 135.0, 77.0, 58.0, 31.0, 36.0, 14.0, 14.0, 8.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.1875, -95.75537109375, -93.3232421875, -90.89111328125, -88.458984375, -86.02685546875, -83.5947265625, -81.16259765625, -78.73046875, -76.29833984375, -73.8662109375, -71.43408203125, -69.001953125, -66.56982421875, -64.1376953125, -61.70556640625, -59.2734375, -56.84130859375, -54.4091796875, -51.97705078125, -49.544921875, -47.11279296875, -44.6806640625, -42.24853515625, -39.81640625, -37.38427734375, -34.9521484375, -32.52001953125, -30.087890625, -27.65576171875, -25.2236328125, -22.79150390625, -20.359375, -17.92724609375, -15.4951171875, -13.06298828125, -10.630859375, -8.19873046875, -5.7666015625, -3.33447265625, -0.90234375, 1.52978515625, 3.9619140625, 6.39404296875, 8.826171875, 11.25830078125, 13.6904296875, 16.12255859375, 18.5546875, 20.98681640625, 23.4189453125, 25.85107421875, 28.283203125, 30.71533203125, 33.1474609375, 35.57958984375, 38.01171875, 40.44384765625, 42.8759765625, 45.30810546875, 47.740234375, 50.17236328125, 52.6044921875, 55.03662109375, 57.46875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 29.0, 165.0, 345.0, 291.0, 139.0, 30.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.14201354980469, -51.978763580322266, -49.815513610839844, -47.652259826660156, -45.489009857177734, -43.32575988769531, -41.16250991821289, -38.99925994873047, -36.83600616455078, -34.67275619506836, -32.50950622558594, -30.346254348754883, -28.183002471923828, -26.019752502441406, -23.856502532958984, -21.693252563476562, -19.53000259399414, -17.36675262451172, -15.203500747680664, -13.040250778198242, -10.876999855041504, -8.713748931884766, -6.550498962402344, -4.3872480392456055, -2.223997116088867, -0.06074643135070801, 2.102504253387451, 4.265754699707031, 6.4290056228637695, 8.592256546020508, 10.75550651550293, 12.918757438659668, 15.082008361816406, 17.245258331298828, 19.408510208129883, 21.571760177612305, 23.73501205444336, 25.89826202392578, 28.061511993408203, 30.224761962890625, 32.38801574707031, 34.551265716552734, 36.714515686035156, 38.877769470214844, 41.041019439697266, 43.20426940917969, 45.36751937866211, 47.53076934814453, 49.69401931762695, 51.857269287109375, 54.0205192565918, 56.18376922607422, 58.347023010253906, 60.51027297973633, 62.67352294921875, 64.83677673339844, 67.0000228881836, 69.16327667236328, 71.32652282714844, 73.48977661132812, 75.65302276611328, 77.81627655029297, 79.97952270507812, 82.14277648925781, 84.3060302734375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 3.0, 6.0, 9.0, 5.0, 16.0, 15.0, 13.0, 18.0, 17.0, 21.0, 20.0, 24.0, 25.0, 23.0, 28.0, 40.0, 42.0, 31.0, 42.0, 50.0, 33.0, 47.0, 35.0, 29.0, 41.0, 35.0, 38.0, 27.0, 36.0, 27.0, 33.0, 24.0, 19.0, 16.0, 11.0, 12.0, 14.0, 9.0, 7.0, 11.0, 9.0, 10.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-53.2945556640625, -51.62506866455078, -49.95558166503906, -48.286094665527344, -46.616607666015625, -44.947120666503906, -43.27763748168945, -41.608150482177734, -39.938663482666016, -38.2691764831543, -36.59968948364258, -34.93020248413086, -33.260719299316406, -31.591230392456055, -29.92174530029297, -28.25225830078125, -26.58277130126953, -24.913284301757812, -23.243797302246094, -21.574312210083008, -19.90482521057129, -18.23533821105957, -16.565853118896484, -14.896366119384766, -13.226879119873047, -11.557392120361328, -9.887906074523926, -8.218420028686523, -6.548933029174805, -4.879446029663086, -3.2099599838256836, -1.5404739379882812, 0.1290130615234375, 1.798499584197998, 3.4679861068725586, 5.137472629547119, 6.80695915222168, 8.476446151733398, 10.1459321975708, 11.815418243408203, 13.484905242919922, 15.15439224243164, 16.82387924194336, 18.493364334106445, 20.162851333618164, 21.832338333129883, 23.50182342529297, 25.171310424804688, 26.840797424316406, 28.510284423828125, 30.179771423339844, 31.84925651550293, 33.51874542236328, 35.188232421875, 36.85771560668945, 38.52720260620117, 40.19668960571289, 41.86617660522461, 43.53566360473633, 45.20515060424805, 46.8746337890625, 48.54412078857422, 50.21360778808594, 51.883094787597656, 53.552581787109375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 12.0, 23.0, 17.0, 20.0, 24.0, 18.0, 34.0, 40.0, 33.0, 34.0, 48.0, 35.0, 34.0, 36.0, 44.0, 46.0, 48.0, 51.0, 43.0, 39.0, 38.0, 44.0, 24.0, 34.0, 17.0, 29.0, 14.0, 26.0, 16.0, 8.0, 7.0, 2.0, 11.0, 6.0, 6.0, 2.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.880126953125, -5.66259765625, -5.445068359375, -5.2275390625, -5.010009765625, -4.79248046875, -4.574951171875, -4.357421875, -4.139892578125, -3.92236328125, -3.704833984375, -3.4873046875, -3.269775390625, -3.05224609375, -2.834716796875, -2.6171875, -2.399658203125, -2.18212890625, -1.964599609375, -1.7470703125, -1.529541015625, -1.31201171875, -1.094482421875, -0.876953125, -0.659423828125, -0.44189453125, -0.224365234375, -0.0068359375, 0.210693359375, 0.42822265625, 0.645751953125, 0.86328125, 1.080810546875, 1.29833984375, 1.515869140625, 1.7333984375, 1.950927734375, 2.16845703125, 2.385986328125, 2.603515625, 2.821044921875, 3.03857421875, 3.256103515625, 3.4736328125, 3.691162109375, 3.90869140625, 4.126220703125, 4.34375, 4.561279296875, 4.77880859375, 4.996337890625, 5.2138671875, 5.431396484375, 5.64892578125, 5.866455078125, 6.083984375, 6.301513671875, 6.51904296875, 6.736572265625, 6.9541015625, 7.171630859375, 7.38916015625, 7.606689453125, 7.82421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 2.0, 7.0, 11.0, 12.0, 16.0, 22.0, 23.0, 24.0, 24.0, 31.0, 37.0, 45.0, 65.0, 139.0, 476.0, 2103.0, 16446.0, 531872.0, 3454642.0, 177468.0, 8556.0, 1462.0, 357.0, 129.0, 73.0, 45.0, 36.0, 29.0, 24.0, 23.0, 17.0, 16.0, 8.0, 11.0, 5.0, 9.0, 2.0, 7.0, 9.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.661865234375, -20.87060546875, -20.079345703125, -19.2880859375, -18.496826171875, -17.70556640625, -16.914306640625, -16.123046875, -15.331787109375, -14.54052734375, -13.749267578125, -12.9580078125, -12.166748046875, -11.37548828125, -10.584228515625, -9.79296875, -9.001708984375, -8.21044921875, -7.419189453125, -6.6279296875, -5.836669921875, -5.04541015625, -4.254150390625, -3.462890625, -2.671630859375, -1.88037109375, -1.089111328125, -0.2978515625, 0.493408203125, 1.28466796875, 2.075927734375, 2.8671875, 3.658447265625, 4.44970703125, 5.240966796875, 6.0322265625, 6.823486328125, 7.61474609375, 8.406005859375, 9.197265625, 9.988525390625, 10.77978515625, 11.571044921875, 12.3623046875, 13.153564453125, 13.94482421875, 14.736083984375, 15.52734375, 16.318603515625, 17.10986328125, 17.901123046875, 18.6923828125, 19.483642578125, 20.27490234375, 21.066162109375, 21.857421875, 22.648681640625, 23.43994140625, 24.231201171875, 25.0224609375, 25.813720703125, 26.60498046875, 27.396240234375, 28.1875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 6.0, 12.0, 23.0, 17.0, 28.0, 28.0, 50.0, 53.0, 78.0, 100.0, 138.0, 170.0, 278.0, 350.0, 404.0, 497.0, 435.0, 359.0, 251.0, 196.0, 161.0, 122.0, 79.0, 74.0, 49.0, 25.0, 22.0, 18.0, 10.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.5859375, -11.1800537109375, -10.774169921875, -10.3682861328125, -9.96240234375, -9.5565185546875, -9.150634765625, -8.7447509765625, -8.3388671875, -7.9329833984375, -7.527099609375, -7.1212158203125, -6.71533203125, -6.3094482421875, -5.903564453125, -5.4976806640625, -5.091796875, -4.6859130859375, -4.280029296875, -3.8741455078125, -3.46826171875, -3.0623779296875, -2.656494140625, -2.2506103515625, -1.8447265625, -1.4388427734375, -1.032958984375, -0.6270751953125, -0.22119140625, 0.1846923828125, 0.590576171875, 0.9964599609375, 1.40234375, 1.8082275390625, 2.214111328125, 2.6199951171875, 3.02587890625, 3.4317626953125, 3.837646484375, 4.2435302734375, 4.6494140625, 5.0552978515625, 5.461181640625, 5.8670654296875, 6.27294921875, 6.6788330078125, 7.084716796875, 7.4906005859375, 7.896484375, 8.3023681640625, 8.708251953125, 9.1141357421875, 9.52001953125, 9.9259033203125, 10.331787109375, 10.7376708984375, 11.1435546875, 11.5494384765625, 11.955322265625, 12.3612060546875, 12.76708984375, 13.1729736328125, 13.578857421875, 13.9847412109375, 14.390625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 14.0, 10.0, 16.0, 33.0, 26.0, 35.0, 51.0, 99.0, 98.0, 148.0, 171.0, 234.0, 312.0, 706.0, 3268.0, 134564.0, 3938568.0, 111124.0, 2926.0, 636.0, 301.0, 215.0, 164.0, 108.0, 103.0, 62.0, 59.0, 62.0, 37.0, 36.0, 21.0, 18.0, 10.0, 19.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-54.0625, -52.58056640625, -51.0986328125, -49.61669921875, -48.134765625, -46.65283203125, -45.1708984375, -43.68896484375, -42.20703125, -40.72509765625, -39.2431640625, -37.76123046875, -36.279296875, -34.79736328125, -33.3154296875, -31.83349609375, -30.3515625, -28.86962890625, -27.3876953125, -25.90576171875, -24.423828125, -22.94189453125, -21.4599609375, -19.97802734375, -18.49609375, -17.01416015625, -15.5322265625, -14.05029296875, -12.568359375, -11.08642578125, -9.6044921875, -8.12255859375, -6.640625, -5.15869140625, -3.6767578125, -2.19482421875, -0.712890625, 0.76904296875, 2.2509765625, 3.73291015625, 5.21484375, 6.69677734375, 8.1787109375, 9.66064453125, 11.142578125, 12.62451171875, 14.1064453125, 15.58837890625, 17.0703125, 18.55224609375, 20.0341796875, 21.51611328125, 22.998046875, 24.47998046875, 25.9619140625, 27.44384765625, 28.92578125, 30.40771484375, 31.8896484375, 33.37158203125, 34.853515625, 36.33544921875, 37.8173828125, 39.29931640625, 40.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 7.0, 17.0, 25.0, 59.0, 83.0, 119.0, 158.0, 128.0, 137.0, 107.0, 67.0, 50.0, 21.0, 10.0, 11.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-115.23910522460938, -112.9880599975586, -110.73701477050781, -108.48597717285156, -106.23493194580078, -103.98388671875, -101.73284912109375, -99.48180389404297, -97.23075866699219, -94.9797134399414, -92.72866821289062, -90.47763061523438, -88.2265853881836, -85.97554016113281, -83.72450256347656, -81.47345733642578, -79.222412109375, -76.97136688232422, -74.72032165527344, -72.46928405761719, -70.2182388305664, -67.96719360351562, -65.71615600585938, -63.465110778808594, -61.21406555175781, -58.96302032470703, -56.711978912353516, -54.4609375, -52.20989227294922, -49.95884704589844, -47.70780563354492, -45.456764221191406, -43.205718994140625, -40.954673767089844, -38.70363235473633, -36.45259094238281, -34.20154571533203, -31.950502395629883, -29.699459075927734, -27.448415756225586, -25.197372436523438, -22.94632911682129, -20.69528579711914, -18.444242477416992, -16.193199157714844, -13.942155838012695, -11.691112518310547, -9.440069198608398, -7.18902587890625, -4.937982559204102, -2.686939239501953, -0.4358959197998047, 1.8151473999023438, 4.066190719604492, 6.317234039306641, 8.568277359008789, 10.819320678710938, 13.070363998413086, 15.321407318115234, 17.572450637817383, 19.82349395751953, 22.07453727722168, 24.325580596923828, 26.576623916625977, 28.827667236328125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 10.0, 5.0, 13.0, 13.0, 13.0, 23.0, 24.0, 20.0, 32.0, 32.0, 28.0, 28.0, 34.0, 32.0, 32.0, 41.0, 39.0, 33.0, 50.0, 38.0, 40.0, 44.0, 35.0, 38.0, 30.0, 30.0, 33.0, 20.0, 21.0, 19.0, 22.0, 20.0, 9.0, 19.0, 12.0, 7.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0], "bins": [-43.00483703613281, -41.735206604003906, -40.465576171875, -39.195945739746094, -37.92631530761719, -36.65668487548828, -35.387054443359375, -34.11742401123047, -32.84779357910156, -31.578163146972656, -30.30853271484375, -29.038902282714844, -27.769271850585938, -26.49964141845703, -25.230010986328125, -23.96038055419922, -22.69074821472168, -21.421117782592773, -20.151487350463867, -18.88185691833496, -17.612226486206055, -16.34259605407715, -15.072964668273926, -13.80333423614502, -12.533703804016113, -11.264073371887207, -9.9944429397583, -8.724811553955078, -7.45518159866333, -6.185551166534424, -4.915920257568359, -3.646289825439453, -2.376659393310547, -1.107028841972351, 0.16260170936584473, 1.43223237991333, 2.7018628120422363, 3.9714932441711426, 5.241124153137207, 6.510754585266113, 7.7803850173950195, 9.050015449523926, 10.319645881652832, 11.589277267456055, 12.858907699584961, 14.128538131713867, 15.398168563842773, 16.66779899597168, 17.937429428100586, 19.207059860229492, 20.4766902923584, 21.746320724487305, 23.01595115661621, 24.285581588745117, 25.555213928222656, 26.824844360351562, 28.09447479248047, 29.364105224609375, 30.63373565673828, 31.903366088867188, 33.172996520996094, 34.442626953125, 35.712257385253906, 36.98188781738281, 38.25151824951172]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 35.0, 33.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 26.0, 21.0, 30.0, 67.0, 69.0, 115.0, 162.0, 273.0, 385.0, 583.0, 1000.0, 1649.0, 2700.0, 4519.0, 7448.0, 12728.0, 22059.0, 38313.0, 68366.0, 120543.0, 193181.0, 217486.0, 151132.0, 88146.0, 49291.0, 28197.0, 16300.0, 9444.0, 5595.0, 3291.0, 2009.0, 1240.0, 783.0, 490.0, 303.0, 209.0, 141.0, 69.0, 63.0, 27.0, 25.0, 20.0, 9.0, 15.0, 10.0, 3.0, 2.0, 1.0, 8.0, 1.0, 2.0], "bins": [-0.8544921875, -0.8295211791992188, -0.8045501708984375, -0.7795791625976562, -0.754608154296875, -0.7296371459960938, -0.7046661376953125, -0.6796951293945312, -0.65472412109375, -0.6297531127929688, -0.6047821044921875, -0.5798110961914062, -0.554840087890625, -0.5298690795898438, -0.5048980712890625, -0.47992706298828125, -0.4549560546875, -0.42998504638671875, -0.4050140380859375, -0.38004302978515625, -0.355072021484375, -0.33010101318359375, -0.3051300048828125, -0.28015899658203125, -0.25518798828125, -0.23021697998046875, -0.2052459716796875, -0.18027496337890625, -0.155303955078125, -0.13033294677734375, -0.1053619384765625, -0.08039093017578125, -0.055419921875, -0.03044891357421875, -0.0054779052734375, 0.01949310302734375, 0.044464111328125, 0.06943511962890625, 0.0944061279296875, 0.11937713623046875, 0.14434814453125, 0.16931915283203125, 0.1942901611328125, 0.21926116943359375, 0.244232177734375, 0.26920318603515625, 0.2941741943359375, 0.31914520263671875, 0.3441162109375, 0.36908721923828125, 0.3940582275390625, 0.41902923583984375, 0.444000244140625, 0.46897125244140625, 0.4939422607421875, 0.5189132690429688, 0.54388427734375, 0.5688552856445312, 0.5938262939453125, 0.6187973022460938, 0.643768310546875, 0.6687393188476562, 0.6937103271484375, 0.7186813354492188, 0.74365234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 2.0, 4.0, 11.0, 13.0, 13.0, 14.0, 11.0, 13.0, 19.0, 26.0, 21.0, 32.0, 28.0, 30.0, 36.0, 31.0, 32.0, 32.0, 37.0, 36.0, 32.0, 1066.0, 37.0, 36.0, 38.0, 31.0, 38.0, 26.0, 36.0, 25.0, 23.0, 26.0, 26.0, 19.0, 16.0, 7.0, 17.0, 11.0, 16.0, 14.0, 8.0, 4.0, 6.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.509765625, -3.39788818359375, -3.2860107421875, -3.17413330078125, -3.062255859375, -2.95037841796875, -2.8385009765625, -2.72662353515625, -2.61474609375, -2.50286865234375, -2.3909912109375, -2.27911376953125, -2.167236328125, -2.05535888671875, -1.9434814453125, -1.83160400390625, -1.7197265625, -1.60784912109375, -1.4959716796875, -1.38409423828125, -1.272216796875, -1.16033935546875, -1.0484619140625, -0.93658447265625, -0.82470703125, -0.71282958984375, -0.6009521484375, -0.48907470703125, -0.377197265625, -0.26531982421875, -0.1534423828125, -0.04156494140625, 0.0703125, 0.18218994140625, 0.2940673828125, 0.40594482421875, 0.517822265625, 0.62969970703125, 0.7415771484375, 0.85345458984375, 0.96533203125, 1.07720947265625, 1.1890869140625, 1.30096435546875, 1.412841796875, 1.52471923828125, 1.6365966796875, 1.74847412109375, 1.8603515625, 1.97222900390625, 2.0841064453125, 2.19598388671875, 2.307861328125, 2.41973876953125, 2.5316162109375, 2.64349365234375, 2.75537109375, 2.86724853515625, 2.9791259765625, 3.09100341796875, 3.202880859375, 3.31475830078125, 3.4266357421875, 3.53851318359375, 3.650390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 19.0, 31.0, 78.0, 96.0, 215.0, 277.0, 446.0, 685.0, 1219.0, 1887.0, 2982.0, 4802.0, 7588.0, 11936.0, 19156.0, 30000.0, 47377.0, 73601.0, 110181.0, 148516.0, 1211482.0, 140107.0, 100719.0, 67169.0, 43015.0, 27496.0, 16985.0, 10812.0, 6888.0, 4241.0, 2692.0, 1684.0, 1054.0, 648.0, 403.0, 252.0, 144.0, 79.0, 57.0, 36.0, 16.0, 23.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46044921875, -0.4457817077636719, -0.43111419677734375, -0.4164466857910156, -0.4017791748046875, -0.3871116638183594, -0.37244415283203125, -0.3577766418457031, -0.343109130859375, -0.3284416198730469, -0.31377410888671875, -0.2991065979003906, -0.2844390869140625, -0.2697715759277344, -0.25510406494140625, -0.24043655395507812, -0.22576904296875, -0.21110153198242188, -0.19643402099609375, -0.18176651000976562, -0.1670989990234375, -0.15243148803710938, -0.13776397705078125, -0.12309646606445312, -0.108428955078125, -0.09376144409179688, -0.07909393310546875, -0.06442642211914062, -0.0497589111328125, -0.035091400146484375, -0.02042388916015625, -0.005756378173828125, 0.0089111328125, 0.023578643798828125, 0.03824615478515625, 0.052913665771484375, 0.0675811767578125, 0.08224868774414062, 0.09691619873046875, 0.11158370971679688, 0.126251220703125, 0.14091873168945312, 0.15558624267578125, 0.17025375366210938, 0.1849212646484375, 0.19958877563476562, 0.21425628662109375, 0.22892379760742188, 0.24359130859375, 0.2582588195800781, 0.27292633056640625, 0.2875938415527344, 0.3022613525390625, 0.3169288635253906, 0.33159637451171875, 0.3462638854980469, 0.360931396484375, 0.3755989074707031, 0.39026641845703125, 0.4049339294433594, 0.4196014404296875, 0.4342689514160156, 0.44893646240234375, 0.4636039733886719, 0.478271484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 15.0, 19.0, 21.0, 20.0, 17.0, 34.0, 32.0, 34.0, 45.0, 51.0, 67.0, 84.0, 72.0, 68.0, 56.0, 53.0, 37.0, 46.0, 39.0, 36.0, 27.0, 11.0, 12.0, 18.0, 10.0, 11.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042572021484375, -0.004100680351257324, -0.0039441585540771484, -0.0037876367568969727, -0.003631114959716797, -0.003474593162536621, -0.0033180713653564453, -0.0031615495681762695, -0.0030050277709960938, -0.002848505973815918, -0.002691984176635742, -0.0025354623794555664, -0.0023789405822753906, -0.002222418785095215, -0.002065896987915039, -0.0019093751907348633, -0.0017528533935546875, -0.0015963315963745117, -0.001439809799194336, -0.0012832880020141602, -0.0011267662048339844, -0.0009702444076538086, -0.0008137226104736328, -0.000657200813293457, -0.0005006790161132812, -0.00034415721893310547, -0.0001876354217529297, -3.1113624572753906e-05, 0.00012540817260742188, 0.00028192996978759766, 0.00043845176696777344, 0.0005949735641479492, 0.000751495361328125, 0.0009080171585083008, 0.0010645389556884766, 0.0012210607528686523, 0.0013775825500488281, 0.001534104347229004, 0.0016906261444091797, 0.0018471479415893555, 0.0020036697387695312, 0.002160191535949707, 0.002316713333129883, 0.0024732351303100586, 0.0026297569274902344, 0.00278627872467041, 0.002942800521850586, 0.0030993223190307617, 0.0032558441162109375, 0.0034123659133911133, 0.003568887710571289, 0.003725409507751465, 0.0038819313049316406, 0.004038453102111816, 0.004194974899291992, 0.004351496696472168, 0.004508018493652344, 0.0046645402908325195, 0.004821062088012695, 0.004977583885192871, 0.005134105682373047, 0.005290627479553223, 0.0054471492767333984, 0.005603671073913574, 0.00576019287109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 8.0, 3.0, 1.0, 10.0, 14.0, 12.0, 16.0, 20.0, 23.0, 27.0, 47.0, 64.0, 61.0, 95.0, 151.0, 230.0, 536.0, 4533.0, 844770.0, 194827.0, 2039.0, 414.0, 163.0, 109.0, 66.0, 62.0, 60.0, 28.0, 23.0, 38.0, 28.0, 15.0, 8.0, 15.0, 6.0, 5.0, 7.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.11370849609375, -0.11062431335449219, -0.10754013061523438, -0.10445594787597656, -0.10137176513671875, -0.09828758239746094, -0.09520339965820312, -0.09211921691894531, -0.0890350341796875, -0.08595085144042969, -0.08286666870117188, -0.07978248596191406, -0.07669830322265625, -0.07361412048339844, -0.07052993774414062, -0.06744575500488281, -0.064361572265625, -0.06127738952636719, -0.058193206787109375, -0.05510902404785156, -0.05202484130859375, -0.04894065856933594, -0.045856475830078125, -0.04277229309082031, -0.0396881103515625, -0.03660392761230469, -0.033519744873046875, -0.030435562133789062, -0.02735137939453125, -0.024267196655273438, -0.021183013916015625, -0.018098831176757812, -0.0150146484375, -0.011930465698242188, -0.008846282958984375, -0.0057621002197265625, -0.00267791748046875, 0.0004062652587890625, 0.003490447998046875, 0.0065746307373046875, 0.0096588134765625, 0.012742996215820312, 0.015827178955078125, 0.018911361694335938, 0.02199554443359375, 0.025079727172851562, 0.028163909912109375, 0.031248092651367188, 0.034332275390625, 0.03741645812988281, 0.040500640869140625, 0.04358482360839844, 0.04666900634765625, 0.04975318908691406, 0.052837371826171875, 0.05592155456542969, 0.0590057373046875, 0.06208992004394531, 0.06517410278320312, 0.06825828552246094, 0.07134246826171875, 0.07442665100097656, 0.07751083374023438, 0.08059501647949219, 0.08367919921875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 85.0, 678.0, 219.0, 25.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032518741209059954, -0.002353122690692544, -0.0014543713768944144, -0.0005556200630962849, 0.0003431313671171665, 0.0012418825644999743, 0.0021406339947134256, 0.003039385424926877, 0.003938136622309685, 0.004836888052523136, 0.0057356394827365875, 0.006634390912950039, 0.00753314234316349, 0.008431892842054367, 0.009330645203590393, 0.01022939570248127, 0.011128148064017296, 0.012026899494230747, 0.012925650924444199, 0.01382440235465765, 0.014723153784871101, 0.015621904283761978, 0.016520656645298004, 0.01741940714418888, 0.018318159505724907, 0.019216910004615784, 0.02011566236615181, 0.021014412865042686, 0.021913165226578712, 0.02281191572546959, 0.023710668087005615, 0.024609418585896492, 0.025508170947432518, 0.026406921446323395, 0.02730567380785942, 0.028204424306750298, 0.029103176668286324, 0.0300019271671772, 0.030900679528713226, 0.03179943189024925, 0.03269818052649498, 0.033596932888031006, 0.03449568152427673, 0.03539443388581276, 0.036293186247348785, 0.03719193860888481, 0.03809068724513054, 0.038989439606666565, 0.03988819196820259, 0.04078694432973862, 0.041685692965984344, 0.04258444532752037, 0.043483197689056396, 0.04438195005059242, 0.04528069868683815, 0.046179451048374176, 0.0470782034099102, 0.04797695577144623, 0.048875704407691956, 0.04977445676922798, 0.05067320913076401, 0.051571961492300034, 0.05247071012854576, 0.05336946249008179, 0.05426821485161781]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 5.0, 14.0, 15.0, 12.0, 23.0, 26.0, 31.0, 32.0, 42.0, 38.0, 31.0, 37.0, 47.0, 54.0, 64.0, 55.0, 57.0, 54.0, 57.0, 47.0, 46.0, 36.0, 34.0, 23.0, 23.0, 26.0, 10.0, 8.0, 15.0, 7.0, 9.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004744350910186768, -0.004613455384969711, -0.004482559859752655, -0.004351664334535599, -0.0042207688093185425, -0.004089873284101486, -0.00395897775888443, -0.0038280822336673737, -0.0036971867084503174, -0.003566291183233261, -0.003435395658016205, -0.0033045001327991486, -0.0031736046075820923, -0.003042709082365036, -0.0029118135571479797, -0.0027809180319309235, -0.002650022506713867, -0.002519126981496811, -0.0023882314562797546, -0.0022573359310626984, -0.002126440405845642, -0.001995544880628586, -0.0018646493554115295, -0.0017337538301944733, -0.001602858304977417, -0.0014719627797603607, -0.0013410672545433044, -0.0012101717293262482, -0.001079276204109192, -0.0009483806788921356, -0.0008174851536750793, -0.0006865896284580231, -0.0005556941032409668, -0.0004247985780239105, -0.00029390305280685425, -0.00016300752758979797, -3.21120023727417e-05, 9.878352284431458e-05, 0.00022967904806137085, 0.0003605745732784271, 0.0004914700984954834, 0.0006223656237125397, 0.000753261148929596, 0.0008841566741466522, 0.0010150521993637085, 0.0011459477245807648, 0.001276843249797821, 0.0014077387750148773, 0.0015386343002319336, 0.0016695298254489899, 0.0018004253506660461, 0.0019313208758831024, 0.0020622164011001587, 0.002193111926317215, 0.0023240074515342712, 0.0024549029767513275, 0.002585798501968384, 0.00271669402718544, 0.0028475895524024963, 0.0029784850776195526, 0.003109380602836609, 0.003240276128053665, 0.0033711716532707214, 0.0035020671784877777, 0.003632962703704834]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 34.0, 34.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 7.0, 7.0, 9.0, 18.0, 23.0, 37.0, 43.0, 51.0, 85.0, 112.0, 200.0, 268.0, 480.0, 791.0, 1395.0, 2436.0, 4623.0, 8854.0, 18548.0, 43427.0, 120629.0, 387109.0, 298168.0, 93773.0, 35318.0, 15425.0, 7420.0, 3983.0, 2167.0, 1195.0, 722.0, 429.0, 251.0, 183.0, 111.0, 72.0, 58.0, 37.0, 28.0, 16.0, 17.0, 9.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.50421142578125, -4.3482666015625, -4.19232177734375, -4.036376953125, -3.88043212890625, -3.7244873046875, -3.56854248046875, -3.41259765625, -3.25665283203125, -3.1007080078125, -2.94476318359375, -2.788818359375, -2.63287353515625, -2.4769287109375, -2.32098388671875, -2.1650390625, -2.00909423828125, -1.8531494140625, -1.69720458984375, -1.541259765625, -1.38531494140625, -1.2293701171875, -1.07342529296875, -0.91748046875, -0.76153564453125, -0.6055908203125, -0.44964599609375, -0.293701171875, -0.13775634765625, 0.0181884765625, 0.17413330078125, 0.330078125, 0.48602294921875, 0.6419677734375, 0.79791259765625, 0.953857421875, 1.10980224609375, 1.2657470703125, 1.42169189453125, 1.57763671875, 1.73358154296875, 1.8895263671875, 2.04547119140625, 2.201416015625, 2.35736083984375, 2.5133056640625, 2.66925048828125, 2.8251953125, 2.98114013671875, 3.1370849609375, 3.29302978515625, 3.448974609375, 3.60491943359375, 3.7608642578125, 3.91680908203125, 4.07275390625, 4.22869873046875, 4.3846435546875, 4.54058837890625, 4.696533203125, 4.85247802734375, 5.0084228515625, 5.16436767578125, 5.3203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 4.0, 12.0, 14.0, 17.0, 12.0, 15.0, 14.0, 21.0, 22.0, 20.0, 29.0, 34.0, 25.0, 43.0, 30.0, 54.0, 83.0, 235.0, 1648.0, 194.0, 67.0, 54.0, 48.0, 38.0, 39.0, 28.0, 30.0, 24.0, 32.0, 22.0, 17.0, 18.0, 11.0, 11.0, 18.0, 12.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.59375, -19.008056640625, -18.42236328125, -17.836669921875, -17.2509765625, -16.665283203125, -16.07958984375, -15.493896484375, -14.908203125, -14.322509765625, -13.73681640625, -13.151123046875, -12.5654296875, -11.979736328125, -11.39404296875, -10.808349609375, -10.22265625, -9.636962890625, -9.05126953125, -8.465576171875, -7.8798828125, -7.294189453125, -6.70849609375, -6.122802734375, -5.537109375, -4.951416015625, -4.36572265625, -3.780029296875, -3.1943359375, -2.608642578125, -2.02294921875, -1.437255859375, -0.8515625, -0.265869140625, 0.31982421875, 0.905517578125, 1.4912109375, 2.076904296875, 2.66259765625, 3.248291015625, 3.833984375, 4.419677734375, 5.00537109375, 5.591064453125, 6.1767578125, 6.762451171875, 7.34814453125, 7.933837890625, 8.51953125, 9.105224609375, 9.69091796875, 10.276611328125, 10.8623046875, 11.447998046875, 12.03369140625, 12.619384765625, 13.205078125, 13.790771484375, 14.37646484375, 14.962158203125, 15.5478515625, 16.133544921875, 16.71923828125, 17.304931640625, 17.890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 5.0, 13.0, 11.0, 16.0, 28.0, 35.0, 43.0, 59.0, 87.0, 122.0, 172.0, 236.0, 362.0, 653.0, 7978.0, 3091226.0, 42388.0, 932.0, 392.0, 246.0, 181.0, 128.0, 86.0, 64.0, 50.0, 42.0, 30.0, 28.0, 15.0, 16.0, 13.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-64.1875, -62.3876953125, -60.587890625, -58.7880859375, -56.98828125, -55.1884765625, -53.388671875, -51.5888671875, -49.7890625, -47.9892578125, -46.189453125, -44.3896484375, -42.58984375, -40.7900390625, -38.990234375, -37.1904296875, -35.390625, -33.5908203125, -31.791015625, -29.9912109375, -28.19140625, -26.3916015625, -24.591796875, -22.7919921875, -20.9921875, -19.1923828125, -17.392578125, -15.5927734375, -13.79296875, -11.9931640625, -10.193359375, -8.3935546875, -6.59375, -4.7939453125, -2.994140625, -1.1943359375, 0.60546875, 2.4052734375, 4.205078125, 6.0048828125, 7.8046875, 9.6044921875, 11.404296875, 13.2041015625, 15.00390625, 16.8037109375, 18.603515625, 20.4033203125, 22.203125, 24.0029296875, 25.802734375, 27.6025390625, 29.40234375, 31.2021484375, 33.001953125, 34.8017578125, 36.6015625, 38.4013671875, 40.201171875, 42.0009765625, 43.80078125, 45.6005859375, 47.400390625, 49.2001953125, 51.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [3.0, 4.0, 41.0, 400.0, 483.0, 82.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.019357681274414, -9.892585754394531, -6.76581335067749, -3.639040946960449, -0.5122690200805664, 2.6145029067993164, 5.741275787353516, 8.868047714233398, 11.994819641113281, 15.121591567993164, 18.248363494873047, 21.375137329101562, 24.501907348632812, 27.628681182861328, 30.75545310974121, 33.882225036621094, 37.008995056152344, 40.13576889038086, 43.26253890991211, 46.389312744140625, 49.516082763671875, 52.64285659790039, 55.769630432128906, 58.896400451660156, 62.02317428588867, 65.14994812011719, 68.27671813964844, 71.40348815917969, 74.53026580810547, 77.65703582763672, 80.78380584716797, 83.91058349609375, 87.03734588623047, 90.16411590576172, 93.2908935546875, 96.41766357421875, 99.54443359375, 102.67120361328125, 105.79798126220703, 108.92475128173828, 112.05152130126953, 115.17829132080078, 118.30506896972656, 121.43183898925781, 124.55860900878906, 127.68537902832031, 130.81214904785156, 133.93893432617188, 137.06570434570312, 140.19247436523438, 143.31924438476562, 146.44601440429688, 149.5727996826172, 152.69956970214844, 155.8263397216797, 158.95310974121094, 162.0798797607422, 165.20664978027344, 168.3334197998047, 171.46018981933594, 174.58697509765625, 177.7137451171875, 180.84051513671875, 183.96728515625, 187.09405517578125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 14.0, 4.0, 12.0, 14.0, 12.0, 16.0, 22.0, 22.0, 28.0, 27.0, 32.0, 32.0, 33.0, 54.0, 44.0, 40.0, 55.0, 34.0, 66.0, 52.0, 44.0, 43.0, 31.0, 41.0, 34.0, 24.0, 38.0, 33.0, 23.0, 17.0, 14.0, 10.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.58349609375, -51.70321273803711, -49.82292556762695, -47.94264221191406, -46.062355041503906, -44.182071685791016, -42.301788330078125, -40.42150115966797, -38.54121780395508, -36.66093444824219, -34.78064727783203, -32.90036392211914, -31.020078659057617, -29.139793395996094, -27.25950813293457, -25.379222869873047, -23.498937606811523, -21.61865234375, -19.738367080688477, -17.858081817626953, -15.977798461914062, -14.097513198852539, -12.217227935791016, -10.336943626403809, -8.456658363342285, -6.57637357711792, -4.696088790893555, -2.8158035278320312, -0.935518741607666, 0.9447660446166992, 2.8250513076782227, 4.70533561706543, 6.585620880126953, 8.465906143188477, 10.346190452575684, 12.226475715637207, 14.106760025024414, 15.987045288085938, 17.86733055114746, 19.747615814208984, 21.627899169921875, 23.5081844329834, 25.388469696044922, 27.268753051757812, 29.149038314819336, 31.02932357788086, 32.90960693359375, 34.789894104003906, 36.67018127441406, 38.55046463012695, 40.43075180053711, 42.31103515625, 44.191322326660156, 46.07160568237305, 47.95188903808594, 49.832176208496094, 51.712459564208984, 53.592742919921875, 55.47303009033203, 57.35331344604492, 59.23360061645508, 61.11388397216797, 62.994171142578125, 64.87445068359375, 66.7547378540039]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 9.0, 11.0, 10.0, 6.0, 10.0, 20.0, 27.0, 19.0, 17.0, 23.0, 25.0, 40.0, 36.0, 38.0, 34.0, 35.0, 40.0, 44.0, 38.0, 50.0, 40.0, 38.0, 33.0, 34.0, 40.0, 36.0, 24.0, 25.0, 30.0, 21.0, 19.0, 15.0, 21.0, 15.0, 9.0, 12.0, 6.0, 9.0, 2.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.37542724609375, -5.1766357421875, -4.97784423828125, -4.779052734375, -4.58026123046875, -4.3814697265625, -4.18267822265625, -3.98388671875, -3.78509521484375, -3.5863037109375, -3.38751220703125, -3.188720703125, -2.98992919921875, -2.7911376953125, -2.59234619140625, -2.3935546875, -2.19476318359375, -1.9959716796875, -1.79718017578125, -1.598388671875, -1.39959716796875, -1.2008056640625, -1.00201416015625, -0.80322265625, -0.60443115234375, -0.4056396484375, -0.20684814453125, -0.008056640625, 0.19073486328125, 0.3895263671875, 0.58831787109375, 0.787109375, 0.98590087890625, 1.1846923828125, 1.38348388671875, 1.582275390625, 1.78106689453125, 1.9798583984375, 2.17864990234375, 2.37744140625, 2.57623291015625, 2.7750244140625, 2.97381591796875, 3.172607421875, 3.37139892578125, 3.5701904296875, 3.76898193359375, 3.9677734375, 4.16656494140625, 4.3653564453125, 4.56414794921875, 4.762939453125, 4.96173095703125, 5.1605224609375, 5.35931396484375, 5.55810546875, 5.75689697265625, 5.9556884765625, 6.15447998046875, 6.353271484375, 6.55206298828125, 6.7508544921875, 6.94964599609375, 7.1484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 14.0, 8.0, 10.0, 4.0, 16.0, 18.0, 15.0, 19.0, 32.0, 28.0, 55.0, 97.0, 199.0, 411.0, 836.0, 2198.0, 7793.0, 50624.0, 836289.0, 2848255.0, 411251.0, 27704.0, 5316.0, 1644.0, 659.0, 297.0, 139.0, 97.0, 60.0, 39.0, 31.0, 34.0, 13.0, 9.0, 11.0, 9.0, 6.0, 7.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.6044921875, -13.068359375, -12.5322265625, -11.99609375, -11.4599609375, -10.923828125, -10.3876953125, -9.8515625, -9.3154296875, -8.779296875, -8.2431640625, -7.70703125, -7.1708984375, -6.634765625, -6.0986328125, -5.5625, -5.0263671875, -4.490234375, -3.9541015625, -3.41796875, -2.8818359375, -2.345703125, -1.8095703125, -1.2734375, -0.7373046875, -0.201171875, 0.3349609375, 0.87109375, 1.4072265625, 1.943359375, 2.4794921875, 3.015625, 3.5517578125, 4.087890625, 4.6240234375, 5.16015625, 5.6962890625, 6.232421875, 6.7685546875, 7.3046875, 7.8408203125, 8.376953125, 8.9130859375, 9.44921875, 9.9853515625, 10.521484375, 11.0576171875, 11.59375, 12.1298828125, 12.666015625, 13.2021484375, 13.73828125, 14.2744140625, 14.810546875, 15.3466796875, 15.8828125, 16.4189453125, 16.955078125, 17.4912109375, 18.02734375, 18.5634765625, 19.099609375, 19.6357421875, 20.171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 7.0, 13.0, 14.0, 29.0, 24.0, 43.0, 37.0, 57.0, 69.0, 102.0, 145.0, 135.0, 216.0, 295.0, 341.0, 403.0, 413.0, 393.0, 311.0, 251.0, 166.0, 145.0, 109.0, 86.0, 52.0, 51.0, 33.0, 35.0, 20.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -8.9642333984375, -8.608154296875, -8.2520751953125, -7.89599609375, -7.5399169921875, -7.183837890625, -6.8277587890625, -6.4716796875, -6.1156005859375, -5.759521484375, -5.4034423828125, -5.04736328125, -4.6912841796875, -4.335205078125, -3.9791259765625, -3.623046875, -3.2669677734375, -2.910888671875, -2.5548095703125, -2.19873046875, -1.8426513671875, -1.486572265625, -1.1304931640625, -0.7744140625, -0.4183349609375, -0.062255859375, 0.2938232421875, 0.64990234375, 1.0059814453125, 1.362060546875, 1.7181396484375, 2.07421875, 2.4302978515625, 2.786376953125, 3.1424560546875, 3.49853515625, 3.8546142578125, 4.210693359375, 4.5667724609375, 4.9228515625, 5.2789306640625, 5.635009765625, 5.9910888671875, 6.34716796875, 6.7032470703125, 7.059326171875, 7.4154052734375, 7.771484375, 8.1275634765625, 8.483642578125, 8.8397216796875, 9.19580078125, 9.5518798828125, 9.907958984375, 10.2640380859375, 10.6201171875, 10.9761962890625, 11.332275390625, 11.6883544921875, 12.04443359375, 12.4005126953125, 12.756591796875, 13.1126708984375, 13.46875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 7.0, 7.0, 7.0, 16.0, 25.0, 24.0, 34.0, 55.0, 67.0, 55.0, 90.0, 101.0, 131.0, 169.0, 250.0, 329.0, 617.0, 4472.0, 229493.0, 3860920.0, 92858.0, 2607.0, 558.0, 300.0, 234.0, 178.0, 149.0, 93.0, 90.0, 77.0, 56.0, 40.0, 28.0, 35.0, 19.0, 21.0, 14.0, 10.0, 9.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-46.28125, -44.93603515625, -43.5908203125, -42.24560546875, -40.900390625, -39.55517578125, -38.2099609375, -36.86474609375, -35.51953125, -34.17431640625, -32.8291015625, -31.48388671875, -30.138671875, -28.79345703125, -27.4482421875, -26.10302734375, -24.7578125, -23.41259765625, -22.0673828125, -20.72216796875, -19.376953125, -18.03173828125, -16.6865234375, -15.34130859375, -13.99609375, -12.65087890625, -11.3056640625, -9.96044921875, -8.615234375, -7.27001953125, -5.9248046875, -4.57958984375, -3.234375, -1.88916015625, -0.5439453125, 0.80126953125, 2.146484375, 3.49169921875, 4.8369140625, 6.18212890625, 7.52734375, 8.87255859375, 10.2177734375, 11.56298828125, 12.908203125, 14.25341796875, 15.5986328125, 16.94384765625, 18.2890625, 19.63427734375, 20.9794921875, 22.32470703125, 23.669921875, 25.01513671875, 26.3603515625, 27.70556640625, 29.05078125, 30.39599609375, 31.7412109375, 33.08642578125, 34.431640625, 35.77685546875, 37.1220703125, 38.46728515625, 39.8125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 14.0, 27.0, 47.0, 74.0, 132.0, 157.0, 147.0, 126.0, 129.0, 76.0, 42.0, 20.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3076171875, -63.020355224609375, -60.73309326171875, -58.445831298828125, -56.1585693359375, -53.871307373046875, -51.58404541015625, -49.296783447265625, -47.009521484375, -44.722259521484375, -42.43499755859375, -40.147735595703125, -37.8604736328125, -35.573211669921875, -33.28594970703125, -30.998687744140625, -28.71142578125, -26.424163818359375, -24.13690185546875, -21.849639892578125, -19.5623779296875, -17.275115966796875, -14.98785400390625, -12.700592041015625, -10.413330078125, -8.126068115234375, -5.83880615234375, -3.551544189453125, -1.2642822265625, 1.022979736328125, 3.31024169921875, 5.597503662109375, 7.884765625, 10.172027587890625, 12.45928955078125, 14.746551513671875, 17.0338134765625, 19.321075439453125, 21.60833740234375, 23.895599365234375, 26.182861328125, 28.470123291015625, 30.75738525390625, 33.044647216796875, 35.3319091796875, 37.619171142578125, 39.90643310546875, 42.193695068359375, 44.48095703125, 46.768218994140625, 49.05548095703125, 51.342742919921875, 53.6300048828125, 55.917266845703125, 58.20452880859375, 60.491790771484375, 62.779052734375, 65.06631469726562, 67.35357666015625, 69.64083862304688, 71.9281005859375, 74.21536254882812, 76.50262451171875, 78.78988647460938, 81.0771484375]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 15.0, 23.0, 21.0, 17.0, 15.0, 24.0, 28.0, 20.0, 48.0, 27.0, 34.0, 36.0, 41.0, 50.0, 40.0, 38.0, 40.0, 36.0, 43.0, 38.0, 40.0, 31.0, 36.0, 37.0, 31.0, 27.0, 17.0, 19.0, 18.0, 18.0, 7.0, 12.0, 12.0, 5.0, 5.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.99188232421875, -38.7181282043457, -37.44437026977539, -36.170616149902344, -34.89685821533203, -33.623104095458984, -32.34934997558594, -31.075593948364258, -29.801837921142578, -28.5280818939209, -27.25432586669922, -25.980571746826172, -24.706815719604492, -23.433059692382812, -22.159305572509766, -20.885549545288086, -19.611793518066406, -18.338037490844727, -17.064281463623047, -15.79052734375, -14.51677131652832, -13.24301528930664, -11.969260215759277, -10.695505142211914, -9.421749114990234, -8.147993087768555, -6.874238014221191, -5.60048246383667, -4.326726913452148, -3.052971363067627, -1.7792158126831055, -0.5054607391357422, 0.7682952880859375, 2.042050838470459, 3.3158063888549805, 4.589561939239502, 5.863317489624023, 7.137073040008545, 8.410828590393066, 9.68458366394043, 10.95833969116211, 12.232095718383789, 13.505850791931152, 14.779605865478516, 16.053361892700195, 17.327117919921875, 18.600872039794922, 19.8746280670166, 21.14838409423828, 22.42214012145996, 23.69589614868164, 24.969650268554688, 26.243406295776367, 27.517162322998047, 28.790916442871094, 30.064672470092773, 31.338428497314453, 32.6121826171875, 33.88594055175781, 35.15969467163086, 36.433448791503906, 37.70720672607422, 38.980960845947266, 40.25471496582031, 41.528472900390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 48.0, 42.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 19.0, 26.0, 31.0, 70.0, 78.0, 110.0, 144.0, 218.0, 341.0, 498.0, 766.0, 1303.0, 1857.0, 2991.0, 4596.0, 7614.0, 11941.0, 19602.0, 32285.0, 52291.0, 85690.0, 137511.0, 189870.0, 179952.0, 122308.0, 76040.0, 46355.0, 27897.0, 17194.0, 10700.0, 6607.0, 4202.0, 2504.0, 1657.0, 1151.0, 701.0, 440.0, 302.0, 210.0, 147.0, 108.0, 62.0, 48.0, 27.0, 22.0, 21.0, 3.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6435546875, -0.62200927734375, -0.6004638671875, -0.57891845703125, -0.557373046875, -0.53582763671875, -0.5142822265625, -0.49273681640625, -0.47119140625, -0.44964599609375, -0.4281005859375, -0.40655517578125, -0.385009765625, -0.36346435546875, -0.3419189453125, -0.32037353515625, -0.298828125, -0.27728271484375, -0.2557373046875, -0.23419189453125, -0.212646484375, -0.19110107421875, -0.1695556640625, -0.14801025390625, -0.12646484375, -0.10491943359375, -0.0833740234375, -0.06182861328125, -0.040283203125, -0.01873779296875, 0.0028076171875, 0.02435302734375, 0.0458984375, 0.06744384765625, 0.0889892578125, 0.11053466796875, 0.132080078125, 0.15362548828125, 0.1751708984375, 0.19671630859375, 0.21826171875, 0.23980712890625, 0.2613525390625, 0.28289794921875, 0.304443359375, 0.32598876953125, 0.3475341796875, 0.36907958984375, 0.390625, 0.41217041015625, 0.4337158203125, 0.45526123046875, 0.476806640625, 0.49835205078125, 0.5198974609375, 0.54144287109375, 0.56298828125, 0.58453369140625, 0.6060791015625, 0.62762451171875, 0.649169921875, 0.67071533203125, 0.6922607421875, 0.71380615234375, 0.7353515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 11.0, 10.0, 5.0, 5.0, 7.0, 14.0, 19.0, 20.0, 13.0, 21.0, 13.0, 22.0, 29.0, 25.0, 22.0, 34.0, 34.0, 38.0, 29.0, 32.0, 36.0, 43.0, 1058.0, 38.0, 32.0, 33.0, 27.0, 39.0, 41.0, 27.0, 27.0, 23.0, 26.0, 16.0, 28.0, 13.0, 22.0, 13.0, 11.0, 10.0, 6.0, 13.0, 12.0, 4.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.955078125, -3.83673095703125, -3.7183837890625, -3.60003662109375, -3.481689453125, -3.36334228515625, -3.2449951171875, -3.12664794921875, -3.00830078125, -2.88995361328125, -2.7716064453125, -2.65325927734375, -2.534912109375, -2.41656494140625, -2.2982177734375, -2.17987060546875, -2.0615234375, -1.94317626953125, -1.8248291015625, -1.70648193359375, -1.588134765625, -1.46978759765625, -1.3514404296875, -1.23309326171875, -1.11474609375, -0.99639892578125, -0.8780517578125, -0.75970458984375, -0.641357421875, -0.52301025390625, -0.4046630859375, -0.28631591796875, -0.16796875, -0.04962158203125, 0.0687255859375, 0.18707275390625, 0.305419921875, 0.42376708984375, 0.5421142578125, 0.66046142578125, 0.77880859375, 0.89715576171875, 1.0155029296875, 1.13385009765625, 1.252197265625, 1.37054443359375, 1.4888916015625, 1.60723876953125, 1.7255859375, 1.84393310546875, 1.9622802734375, 2.08062744140625, 2.198974609375, 2.31732177734375, 2.4356689453125, 2.55401611328125, 2.67236328125, 2.79071044921875, 2.9090576171875, 3.02740478515625, 3.145751953125, 3.26409912109375, 3.3824462890625, 3.50079345703125, 3.619140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 11.0, 12.0, 26.0, 26.0, 54.0, 83.0, 121.0, 236.0, 364.0, 551.0, 990.0, 1532.0, 2555.0, 4221.0, 6958.0, 11293.0, 18404.0, 29953.0, 48489.0, 77285.0, 117860.0, 162251.0, 1220772.0, 139291.0, 94775.0, 61097.0, 37769.0, 23318.0, 14570.0, 8713.0, 5330.0, 3175.0, 1972.0, 1229.0, 747.0, 390.0, 260.0, 167.0, 88.0, 63.0, 44.0, 28.0, 16.0, 18.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.5322265625, -0.515716552734375, -0.49920654296875, -0.482696533203125, -0.4661865234375, -0.449676513671875, -0.43316650390625, -0.416656494140625, -0.400146484375, -0.383636474609375, -0.36712646484375, -0.350616455078125, -0.3341064453125, -0.317596435546875, -0.30108642578125, -0.284576416015625, -0.26806640625, -0.251556396484375, -0.23504638671875, -0.218536376953125, -0.2020263671875, -0.185516357421875, -0.16900634765625, -0.152496337890625, -0.135986328125, -0.119476318359375, -0.10296630859375, -0.086456298828125, -0.0699462890625, -0.053436279296875, -0.03692626953125, -0.020416259765625, -0.00390625, 0.012603759765625, 0.02911376953125, 0.045623779296875, 0.0621337890625, 0.078643798828125, 0.09515380859375, 0.111663818359375, 0.128173828125, 0.144683837890625, 0.16119384765625, 0.177703857421875, 0.1942138671875, 0.210723876953125, 0.22723388671875, 0.243743896484375, 0.26025390625, 0.276763916015625, 0.29327392578125, 0.309783935546875, 0.3262939453125, 0.342803955078125, 0.35931396484375, 0.375823974609375, 0.392333984375, 0.408843994140625, 0.42535400390625, 0.441864013671875, 0.4583740234375, 0.474884033203125, 0.49139404296875, 0.507904052734375, 0.5244140625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 14.0, 6.0, 4.0, 12.0, 8.0, 14.0, 32.0, 30.0, 21.0, 55.0, 48.0, 71.0, 81.0, 83.0, 77.0, 78.0, 81.0, 53.0, 57.0, 45.0, 30.0, 25.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005512237548828125, -0.005355119705200195, -0.005198001861572266, -0.005040884017944336, -0.004883766174316406, -0.0047266483306884766, -0.004569530487060547, -0.004412412643432617, -0.0042552947998046875, -0.004098176956176758, -0.003941059112548828, -0.0037839412689208984, -0.0036268234252929688, -0.003469705581665039, -0.0033125877380371094, -0.0031554698944091797, -0.00299835205078125, -0.0028412342071533203, -0.0026841163635253906, -0.002526998519897461, -0.0023698806762695312, -0.0022127628326416016, -0.002055644989013672, -0.0018985271453857422, -0.0017414093017578125, -0.0015842914581298828, -0.0014271736145019531, -0.0012700557708740234, -0.0011129379272460938, -0.0009558200836181641, -0.0007987022399902344, -0.0006415843963623047, -0.000484466552734375, -0.0003273487091064453, -0.00017023086547851562, -1.3113021850585938e-05, 0.00014400482177734375, 0.00030112266540527344, 0.0004582405090332031, 0.0006153583526611328, 0.0007724761962890625, 0.0009295940399169922, 0.0010867118835449219, 0.0012438297271728516, 0.0014009475708007812, 0.001558065414428711, 0.0017151832580566406, 0.0018723011016845703, 0.0020294189453125, 0.0021865367889404297, 0.0023436546325683594, 0.002500772476196289, 0.0026578903198242188, 0.0028150081634521484, 0.002972126007080078, 0.003129243850708008, 0.0032863616943359375, 0.003443479537963867, 0.003600597381591797, 0.0037577152252197266, 0.003914833068847656, 0.004071950912475586, 0.004229068756103516, 0.004386186599731445, 0.004543304443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 9.0, 3.0, 8.0, 6.0, 5.0, 15.0, 19.0, 24.0, 35.0, 42.0, 76.0, 106.0, 164.0, 375.0, 3955.0, 1030283.0, 12376.0, 473.0, 190.0, 119.0, 77.0, 45.0, 41.0, 27.0, 16.0, 10.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1015625, -0.09801101684570312, -0.09445953369140625, -0.09090805053710938, -0.0873565673828125, -0.08380508422851562, -0.08025360107421875, -0.07670211791992188, -0.073150634765625, -0.06959915161132812, -0.06604766845703125, -0.062496185302734375, -0.0589447021484375, -0.055393218994140625, -0.05184173583984375, -0.048290252685546875, -0.04473876953125, -0.041187286376953125, -0.03763580322265625, -0.034084320068359375, -0.0305328369140625, -0.026981353759765625, -0.02342987060546875, -0.019878387451171875, -0.016326904296875, -0.012775421142578125, -0.00922393798828125, -0.005672454833984375, -0.0021209716796875, 0.001430511474609375, 0.00498199462890625, 0.008533477783203125, 0.0120849609375, 0.015636444091796875, 0.01918792724609375, 0.022739410400390625, 0.0262908935546875, 0.029842376708984375, 0.03339385986328125, 0.036945343017578125, 0.040496826171875, 0.044048309326171875, 0.04759979248046875, 0.051151275634765625, 0.0547027587890625, 0.058254241943359375, 0.06180572509765625, 0.06535720825195312, 0.06890869140625, 0.07246017456054688, 0.07601165771484375, 0.07956314086914062, 0.0831146240234375, 0.08666610717773438, 0.09021759033203125, 0.09376907348632812, 0.097320556640625, 0.10087203979492188, 0.10442352294921875, 0.10797500610351562, 0.1115264892578125, 0.11507797241210938, 0.11862945556640625, 0.12218093872070312, 0.125732421875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [33.0, 727.0, 244.0, 13.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015578450402244925, -0.0006737327785231173, 0.00021037948317825794, 0.001094491803087294, 0.0019786041229963303, 0.002862716093659401, 0.003746828529983759, 0.00463094050064683, 0.005515052936971188, 0.006399165373295546, 0.007283277343958616, 0.008167389780282974, 0.009051501750946045, 0.009935613721609116, 0.010819726623594761, 0.011703838594257832, 0.012587951496243477, 0.013472063466906548, 0.014356176368892193, 0.015240288339555264, 0.01612440124154091, 0.01700851321220398, 0.01789262518286705, 0.01877673715353012, 0.01966084912419319, 0.020544961094856262, 0.021429073065519333, 0.022313185036182404, 0.023197298869490623, 0.024081410840153694, 0.024965522810816765, 0.025849634781479836, 0.026733746752142906, 0.027617858722805977, 0.028501970693469048, 0.029386084526777267, 0.030270196497440338, 0.03115430846810341, 0.03203842043876648, 0.03292253240942955, 0.03380664438009262, 0.03469075635075569, 0.03557486832141876, 0.03645898029208183, 0.037343092262744904, 0.038227204233407974, 0.039111316204071045, 0.039995431900024414, 0.040879543870687485, 0.041763655841350555, 0.042647767812013626, 0.0435318797826767, 0.04441599175333977, 0.04530010372400284, 0.04618421941995621, 0.04706832766532898, 0.04795243963599205, 0.04883655160665512, 0.04972066357731819, 0.05060477554798126, 0.05148888751864433, 0.052372999489307404, 0.05325711518526077, 0.054141223430633545, 0.055025339126586914]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 6.0, 10.0, 13.0, 25.0, 27.0, 25.0, 36.0, 31.0, 44.0, 32.0, 38.0, 64.0, 59.0, 47.0, 48.0, 59.0, 58.0, 55.0, 45.0, 44.0, 39.0, 32.0, 24.0, 24.0, 20.0, 21.0, 19.0, 21.0, 15.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031934380531311035, -0.0031006978824734688, -0.003007957711815834, -0.0029152175411581993, -0.0028224773705005646, -0.00272973719984293, -0.002636997029185295, -0.0025442568585276604, -0.0024515166878700256, -0.002358776517212391, -0.002266036346554756, -0.0021732961758971214, -0.0020805560052394867, -0.001987815834581852, -0.0018950756639242172, -0.0018023354932665825, -0.0017095953226089478, -0.001616855151951313, -0.0015241149812936783, -0.0014313748106360435, -0.0013386346399784088, -0.001245894469320774, -0.0011531542986631393, -0.0010604141280055046, -0.0009676739573478699, -0.0008749337866902351, -0.0007821936160326004, -0.0006894534453749657, -0.0005967132747173309, -0.0005039731040596962, -0.00041123293340206146, -0.00031849276274442673, -0.000225752592086792, -0.00013301242142915726, -4.027225077152252e-05, 5.246791988611221e-05, 0.00014520809054374695, 0.00023794826120138168, 0.0003306884318590164, 0.00042342860251665115, 0.0005161687731742859, 0.0006089089438319206, 0.0007016491144895554, 0.0007943892851471901, 0.0008871294558048248, 0.0009798696264624596, 0.0010726097971200943, 0.001165349967777729, 0.0012580901384353638, 0.0013508303090929985, 0.0014435704797506332, 0.001536310650408268, 0.0016290508210659027, 0.0017217909917235374, 0.0018145311623811722, 0.001907271333038807, 0.0020000115036964417, 0.0020927516743540764, 0.002185491845011711, 0.002278232015669346, 0.0023709721863269806, 0.0024637123569846153, 0.00255645252764225, 0.002649192698299885, 0.0027419328689575195]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 47.0, 43.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 16.0, 15.0, 21.0, 24.0, 44.0, 39.0, 73.0, 128.0, 152.0, 252.0, 432.0, 787.0, 1481.0, 3160.0, 7529.0, 20845.0, 80455.0, 371038.0, 431717.0, 91772.0, 23355.0, 8045.0, 3340.0, 1693.0, 842.0, 446.0, 282.0, 168.0, 105.0, 68.0, 51.0, 37.0, 36.0, 22.0, 12.0, 16.0, 9.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.4124755859375, -5.219482421875, -5.0264892578125, -4.83349609375, -4.6405029296875, -4.447509765625, -4.2545166015625, -4.0615234375, -3.8685302734375, -3.675537109375, -3.4825439453125, -3.28955078125, -3.0965576171875, -2.903564453125, -2.7105712890625, -2.517578125, -2.3245849609375, -2.131591796875, -1.9385986328125, -1.74560546875, -1.5526123046875, -1.359619140625, -1.1666259765625, -0.9736328125, -0.7806396484375, -0.587646484375, -0.3946533203125, -0.20166015625, -0.0086669921875, 0.184326171875, 0.3773193359375, 0.5703125, 0.7633056640625, 0.956298828125, 1.1492919921875, 1.34228515625, 1.5352783203125, 1.728271484375, 1.9212646484375, 2.1142578125, 2.3072509765625, 2.500244140625, 2.6932373046875, 2.88623046875, 3.0792236328125, 3.272216796875, 3.4652099609375, 3.658203125, 3.8511962890625, 4.044189453125, 4.2371826171875, 4.43017578125, 4.6231689453125, 4.816162109375, 5.0091552734375, 5.2021484375, 5.3951416015625, 5.588134765625, 5.7811279296875, 5.97412109375, 6.1671142578125, 6.360107421875, 6.5531005859375, 6.74609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 10.0, 8.0, 9.0, 11.0, 20.0, 17.0, 14.0, 19.0, 17.0, 31.0, 28.0, 29.0, 26.0, 38.0, 32.0, 52.0, 47.0, 89.0, 347.0, 1567.0, 139.0, 69.0, 41.0, 38.0, 35.0, 33.0, 30.0, 29.0, 40.0, 18.0, 22.0, 25.0, 22.0, 6.0, 10.0, 9.0, 5.0, 5.0, 11.0, 7.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-19.421875, -18.818359375, -18.21484375, -17.611328125, -17.0078125, -16.404296875, -15.80078125, -15.197265625, -14.59375, -13.990234375, -13.38671875, -12.783203125, -12.1796875, -11.576171875, -10.97265625, -10.369140625, -9.765625, -9.162109375, -8.55859375, -7.955078125, -7.3515625, -6.748046875, -6.14453125, -5.541015625, -4.9375, -4.333984375, -3.73046875, -3.126953125, -2.5234375, -1.919921875, -1.31640625, -0.712890625, -0.109375, 0.494140625, 1.09765625, 1.701171875, 2.3046875, 2.908203125, 3.51171875, 4.115234375, 4.71875, 5.322265625, 5.92578125, 6.529296875, 7.1328125, 7.736328125, 8.33984375, 8.943359375, 9.546875, 10.150390625, 10.75390625, 11.357421875, 11.9609375, 12.564453125, 13.16796875, 13.771484375, 14.375, 14.978515625, 15.58203125, 16.185546875, 16.7890625, 17.392578125, 17.99609375, 18.599609375, 19.203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 11.0, 16.0, 17.0, 19.0, 22.0, 36.0, 68.0, 105.0, 166.0, 266.0, 504.0, 1878.0, 2726368.0, 413560.0, 1536.0, 440.0, 246.0, 163.0, 87.0, 54.0, 41.0, 31.0, 21.0, 15.0, 13.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.25, -73.7041015625, -71.158203125, -68.6123046875, -66.06640625, -63.5205078125, -60.974609375, -58.4287109375, -55.8828125, -53.3369140625, -50.791015625, -48.2451171875, -45.69921875, -43.1533203125, -40.607421875, -38.0615234375, -35.515625, -32.9697265625, -30.423828125, -27.8779296875, -25.33203125, -22.7861328125, -20.240234375, -17.6943359375, -15.1484375, -12.6025390625, -10.056640625, -7.5107421875, -4.96484375, -2.4189453125, 0.126953125, 2.6728515625, 5.21875, 7.7646484375, 10.310546875, 12.8564453125, 15.40234375, 17.9482421875, 20.494140625, 23.0400390625, 25.5859375, 28.1318359375, 30.677734375, 33.2236328125, 35.76953125, 38.3154296875, 40.861328125, 43.4072265625, 45.953125, 48.4990234375, 51.044921875, 53.5908203125, 56.13671875, 58.6826171875, 61.228515625, 63.7744140625, 66.3203125, 68.8662109375, 71.412109375, 73.9580078125, 76.50390625, 79.0498046875, 81.595703125, 84.1416015625, 86.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 26.0, 163.0, 310.0, 317.0, 137.0, 41.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.58265686035156, -36.074092864990234, -34.56553268432617, -33.056968688964844, -31.54840850830078, -30.039846420288086, -28.53128433227539, -27.022720336914062, -25.51416015625, -24.005598068237305, -22.49703598022461, -20.988473892211914, -19.47991180419922, -17.971349716186523, -16.462787628173828, -14.954224586486816, -13.445661544799805, -11.93709945678711, -10.428537368774414, -8.919975280761719, -7.411412715911865, -5.90285062789917, -4.394288063049316, -2.885725975036621, -1.3771638870239258, 0.13139832019805908, 1.639960527420044, 3.1485228538513184, 4.657084941864014, 6.165647029876709, 7.6742095947265625, 9.182771682739258, 10.691333770751953, 12.199895858764648, 13.708457946777344, 15.217020034790039, 16.725582122802734, 18.23414421081543, 19.742706298828125, 21.251270294189453, 22.759830474853516, 24.26839256286621, 25.776954650878906, 27.2855167388916, 28.794078826904297, 30.302640914916992, 31.811203002929688, 33.319766998291016, 34.828330993652344, 36.33689498901367, 37.845455169677734, 39.35401916503906, 40.862579345703125, 42.37114334106445, 43.879703521728516, 45.388267517089844, 46.896827697753906, 48.405391693115234, 49.9139518737793, 51.422515869140625, 52.93107604980469, 54.439640045166016, 55.94820022583008, 57.456764221191406, 58.96532440185547]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 20.0, 15.0, 16.0, 16.0, 27.0, 28.0, 26.0, 44.0, 27.0, 38.0, 38.0, 46.0, 43.0, 44.0, 36.0, 53.0, 49.0, 40.0, 39.0, 43.0, 35.0, 26.0, 30.0, 24.0, 18.0, 24.0, 19.0, 18.0, 11.0, 12.0, 16.0, 6.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.525245666503906, -54.71100616455078, -52.896766662597656, -51.08252716064453, -49.268287658691406, -47.45404815673828, -45.63980484008789, -43.825565338134766, -42.01132583618164, -40.197086334228516, -38.38284683227539, -36.568607330322266, -34.754364013671875, -32.94012451171875, -31.125885009765625, -29.3116455078125, -27.497406005859375, -25.68316650390625, -23.868927001953125, -22.054685592651367, -20.240446090698242, -18.426206588745117, -16.61196517944336, -14.797725677490234, -12.98348617553711, -11.169246673583984, -9.355006217956543, -7.54076623916626, -5.726526260375977, -3.9122867584228516, -2.09804630279541, -0.28380584716796875, 1.5304336547851562, 3.3446736335754395, 5.158913612365723, 6.973153591156006, 8.787393569946289, 10.601633071899414, 12.415873527526855, 14.230113983154297, 16.044353485107422, 17.858592987060547, 19.672832489013672, 21.48707389831543, 23.301313400268555, 25.11555290222168, 26.929794311523438, 28.744033813476562, 30.558273315429688, 32.37251281738281, 34.18675231933594, 36.00099182128906, 37.81523132324219, 39.62947082519531, 41.4437141418457, 43.25795364379883, 45.07219314575195, 46.88643264770508, 48.7006721496582, 50.51491165161133, 52.32915496826172, 54.143394470214844, 55.95763397216797, 57.771873474121094, 59.58611297607422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 9.0, 9.0, 11.0, 9.0, 20.0, 8.0, 14.0, 19.0, 25.0, 36.0, 23.0, 31.0, 32.0, 30.0, 43.0, 31.0, 61.0, 41.0, 41.0, 45.0, 52.0, 30.0, 39.0, 36.0, 33.0, 40.0, 25.0, 31.0, 28.0, 20.0, 24.0, 13.0, 17.0, 16.0, 13.0, 10.0, 5.0, 1.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0859375, -5.8760986328125, -5.666259765625, -5.4564208984375, -5.24658203125, -5.0367431640625, -4.826904296875, -4.6170654296875, -4.4072265625, -4.1973876953125, -3.987548828125, -3.7777099609375, -3.56787109375, -3.3580322265625, -3.148193359375, -2.9383544921875, -2.728515625, -2.5186767578125, -2.308837890625, -2.0989990234375, -1.88916015625, -1.6793212890625, -1.469482421875, -1.2596435546875, -1.0498046875, -0.8399658203125, -0.630126953125, -0.4202880859375, -0.21044921875, -0.0006103515625, 0.209228515625, 0.4190673828125, 0.62890625, 0.8387451171875, 1.048583984375, 1.2584228515625, 1.46826171875, 1.6781005859375, 1.887939453125, 2.0977783203125, 2.3076171875, 2.5174560546875, 2.727294921875, 2.9371337890625, 3.14697265625, 3.3568115234375, 3.566650390625, 3.7764892578125, 3.986328125, 4.1961669921875, 4.406005859375, 4.6158447265625, 4.82568359375, 5.0355224609375, 5.245361328125, 5.4552001953125, 5.6650390625, 5.8748779296875, 6.084716796875, 6.2945556640625, 6.50439453125, 6.7142333984375, 6.924072265625, 7.1339111328125, 7.34375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 14.0, 5.0, 10.0, 14.0, 17.0, 28.0, 22.0, 26.0, 39.0, 42.0, 48.0, 59.0, 79.0, 111.0, 175.0, 280.0, 718.0, 2210.0, 11054.0, 103648.0, 1550228.0, 2300031.0, 203154.0, 17149.0, 3107.0, 904.0, 361.0, 180.0, 129.0, 97.0, 81.0, 50.0, 40.0, 34.0, 27.0, 32.0, 19.0, 10.0, 11.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8125, -13.28369140625, -12.7548828125, -12.22607421875, -11.697265625, -11.16845703125, -10.6396484375, -10.11083984375, -9.58203125, -9.05322265625, -8.5244140625, -7.99560546875, -7.466796875, -6.93798828125, -6.4091796875, -5.88037109375, -5.3515625, -4.82275390625, -4.2939453125, -3.76513671875, -3.236328125, -2.70751953125, -2.1787109375, -1.64990234375, -1.12109375, -0.59228515625, -0.0634765625, 0.46533203125, 0.994140625, 1.52294921875, 2.0517578125, 2.58056640625, 3.109375, 3.63818359375, 4.1669921875, 4.69580078125, 5.224609375, 5.75341796875, 6.2822265625, 6.81103515625, 7.33984375, 7.86865234375, 8.3974609375, 8.92626953125, 9.455078125, 9.98388671875, 10.5126953125, 11.04150390625, 11.5703125, 12.09912109375, 12.6279296875, 13.15673828125, 13.685546875, 14.21435546875, 14.7431640625, 15.27197265625, 15.80078125, 16.32958984375, 16.8583984375, 17.38720703125, 17.916015625, 18.44482421875, 18.9736328125, 19.50244140625, 20.03125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 13.0, 12.0, 12.0, 19.0, 26.0, 51.0, 52.0, 56.0, 88.0, 98.0, 136.0, 166.0, 208.0, 292.0, 390.0, 456.0, 442.0, 378.0, 290.0, 225.0, 160.0, 128.0, 98.0, 62.0, 60.0, 34.0, 28.0, 33.0, 20.0, 10.0, 10.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.086181640625, -12.71142578125, -12.336669921875, -11.9619140625, -11.587158203125, -11.21240234375, -10.837646484375, -10.462890625, -10.088134765625, -9.71337890625, -9.338623046875, -8.9638671875, -8.589111328125, -8.21435546875, -7.839599609375, -7.46484375, -7.090087890625, -6.71533203125, -6.340576171875, -5.9658203125, -5.591064453125, -5.21630859375, -4.841552734375, -4.466796875, -4.092041015625, -3.71728515625, -3.342529296875, -2.9677734375, -2.593017578125, -2.21826171875, -1.843505859375, -1.46875, -1.093994140625, -0.71923828125, -0.344482421875, 0.0302734375, 0.405029296875, 0.77978515625, 1.154541015625, 1.529296875, 1.904052734375, 2.27880859375, 2.653564453125, 3.0283203125, 3.403076171875, 3.77783203125, 4.152587890625, 4.52734375, 4.902099609375, 5.27685546875, 5.651611328125, 6.0263671875, 6.401123046875, 6.77587890625, 7.150634765625, 7.525390625, 7.900146484375, 8.27490234375, 8.649658203125, 9.0244140625, 9.399169921875, 9.77392578125, 10.148681640625, 10.5234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 31.0, 39.0, 32.0, 46.0, 71.0, 97.0, 102.0, 143.0, 160.0, 255.0, 303.0, 543.0, 2324.0, 153659.0, 3984583.0, 48541.0, 1483.0, 479.0, 292.0, 209.0, 198.0, 135.0, 116.0, 96.0, 64.0, 54.0, 52.0, 34.0, 25.0, 19.0, 10.0, 16.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.71875, -43.08642578125, -41.4541015625, -39.82177734375, -38.189453125, -36.55712890625, -34.9248046875, -33.29248046875, -31.66015625, -30.02783203125, -28.3955078125, -26.76318359375, -25.130859375, -23.49853515625, -21.8662109375, -20.23388671875, -18.6015625, -16.96923828125, -15.3369140625, -13.70458984375, -12.072265625, -10.43994140625, -8.8076171875, -7.17529296875, -5.54296875, -3.91064453125, -2.2783203125, -0.64599609375, 0.986328125, 2.61865234375, 4.2509765625, 5.88330078125, 7.515625, 9.14794921875, 10.7802734375, 12.41259765625, 14.044921875, 15.67724609375, 17.3095703125, 18.94189453125, 20.57421875, 22.20654296875, 23.8388671875, 25.47119140625, 27.103515625, 28.73583984375, 30.3681640625, 32.00048828125, 33.6328125, 35.26513671875, 36.8974609375, 38.52978515625, 40.162109375, 41.79443359375, 43.4267578125, 45.05908203125, 46.69140625, 48.32373046875, 49.9560546875, 51.58837890625, 53.220703125, 54.85302734375, 56.4853515625, 58.11767578125, 59.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 16.0, 127.0, 353.0, 378.0, 117.0, 20.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.40177154541016, -113.42817687988281, -107.45457458496094, -101.4809799194336, -95.50738525390625, -89.53378295898438, -83.56018829345703, -77.58659362792969, -71.61299133300781, -65.63939666748047, -59.66579818725586, -53.69219970703125, -47.718605041503906, -41.7450065612793, -35.77140808105469, -29.797813415527344, -23.82421875, -17.850622177124023, -11.87702465057373, -5.9034271240234375, 0.07016944885253906, 6.043766021728516, 12.017364501953125, 17.99095916748047, 23.964557647705078, 29.938154220581055, 35.91175079345703, 41.88534927368164, 47.85894775390625, 53.832542419433594, 59.8061408996582, 65.77973937988281, 71.75334167480469, 77.72693634033203, 83.7005386352539, 89.67413330078125, 95.6477279663086, 101.62132263183594, 107.59492492675781, 113.56851959228516, 119.5421142578125, 125.51570892333984, 131.4893035888672, 137.46290588378906, 143.43650817871094, 149.41009521484375, 155.38369750976562, 161.3572998046875, 167.33090209960938, 173.30450439453125, 179.27809143066406, 185.25169372558594, 191.2252960205078, 197.19888305664062, 203.1724853515625, 209.14608764648438, 215.1196746826172, 221.09327697753906, 227.06686401367188, 233.04046630859375, 239.01406860351562, 244.98765563964844, 250.9612579345703, 256.9348449707031, 262.908447265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 13.0, 14.0, 15.0, 11.0, 19.0, 26.0, 27.0, 28.0, 24.0, 38.0, 32.0, 38.0, 51.0, 50.0, 42.0, 45.0, 42.0, 54.0, 42.0, 42.0, 35.0, 31.0, 40.0, 34.0, 30.0, 28.0, 21.0, 24.0, 16.0, 18.0, 7.0, 10.0, 13.0, 4.0, 5.0, 3.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.3616943359375, -47.98292541503906, -46.60416030883789, -45.22539138793945, -43.84662628173828, -42.467857360839844, -41.089088439941406, -39.71031951904297, -38.3315544128418, -36.95278549194336, -35.57402038574219, -34.19525146484375, -32.81648254394531, -31.43771743774414, -30.058948516845703, -28.6801815032959, -27.301414489746094, -25.92264747619629, -24.543880462646484, -23.165111541748047, -21.786344528198242, -20.407577514648438, -19.02880859375, -17.650041580200195, -16.27127456665039, -14.892507553100586, -13.513739585876465, -12.134971618652344, -10.756204605102539, -9.377437591552734, -7.998669624328613, -6.619901657104492, -5.2411346435546875, -3.8623671531677246, -2.4835996627807617, -1.1048321723937988, 0.27393531799316406, 1.652702808380127, 3.03147029876709, 4.410238265991211, 5.789005279541016, 7.1677727699279785, 8.546540260314941, 9.925308227539062, 11.304075241088867, 12.682842254638672, 14.061610221862793, 15.440378189086914, 16.81914520263672, 18.197912216186523, 19.576679229736328, 20.955448150634766, 22.33421516418457, 23.712982177734375, 25.091751098632812, 26.470518112182617, 27.849285125732422, 29.228052139282227, 30.60681915283203, 31.98558807373047, 33.364356994628906, 34.74312210083008, 36.121891021728516, 37.50065612792969, 38.879425048828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 44.0, 49.0, 37.0, 29.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 8.0, 7.0, 9.0, 17.0, 13.0, 41.0, 57.0, 58.0, 101.0, 155.0, 226.0, 282.0, 479.0, 760.0, 1077.0, 1703.0, 2625.0, 4058.0, 6268.0, 10183.0, 16396.0, 26203.0, 42071.0, 68373.0, 106964.0, 154932.0, 181413.0, 149102.0, 101952.0, 64911.0, 40696.0, 25227.0, 15575.0, 9709.0, 5865.0, 3936.0, 2393.0, 1551.0, 1005.0, 681.0, 501.0, 311.0, 211.0, 136.0, 84.0, 79.0, 45.0, 33.0, 27.0, 20.0, 10.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.63916015625, -0.61883544921875, -0.5985107421875, -0.57818603515625, -0.557861328125, -0.53753662109375, -0.5172119140625, -0.49688720703125, -0.4765625, -0.45623779296875, -0.4359130859375, -0.41558837890625, -0.395263671875, -0.37493896484375, -0.3546142578125, -0.33428955078125, -0.31396484375, -0.29364013671875, -0.2733154296875, -0.25299072265625, -0.232666015625, -0.21234130859375, -0.1920166015625, -0.17169189453125, -0.1513671875, -0.13104248046875, -0.1107177734375, -0.09039306640625, -0.070068359375, -0.04974365234375, -0.0294189453125, -0.00909423828125, 0.01123046875, 0.03155517578125, 0.0518798828125, 0.07220458984375, 0.092529296875, 0.11285400390625, 0.1331787109375, 0.15350341796875, 0.173828125, 0.19415283203125, 0.2144775390625, 0.23480224609375, 0.255126953125, 0.27545166015625, 0.2957763671875, 0.31610107421875, 0.33642578125, 0.35675048828125, 0.3770751953125, 0.39739990234375, 0.417724609375, 0.43804931640625, 0.4583740234375, 0.47869873046875, 0.4990234375, 0.51934814453125, 0.5396728515625, 0.55999755859375, 0.580322265625, 0.60064697265625, 0.6209716796875, 0.64129638671875, 0.66162109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 3.0, 14.0, 19.0, 12.0, 12.0, 14.0, 24.0, 27.0, 29.0, 24.0, 32.0, 42.0, 40.0, 37.0, 60.0, 43.0, 47.0, 1067.0, 52.0, 47.0, 35.0, 42.0, 40.0, 45.0, 41.0, 33.0, 21.0, 14.0, 25.0, 20.0, 16.0, 8.0, 2.0, 7.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.0546875, -4.91143798828125, -4.7681884765625, -4.62493896484375, -4.481689453125, -4.33843994140625, -4.1951904296875, -4.05194091796875, -3.90869140625, -3.76544189453125, -3.6221923828125, -3.47894287109375, -3.335693359375, -3.19244384765625, -3.0491943359375, -2.90594482421875, -2.7626953125, -2.61944580078125, -2.4761962890625, -2.33294677734375, -2.189697265625, -2.04644775390625, -1.9031982421875, -1.75994873046875, -1.61669921875, -1.47344970703125, -1.3302001953125, -1.18695068359375, -1.043701171875, -0.90045166015625, -0.7572021484375, -0.61395263671875, -0.470703125, -0.32745361328125, -0.1842041015625, -0.04095458984375, 0.102294921875, 0.24554443359375, 0.3887939453125, 0.53204345703125, 0.67529296875, 0.81854248046875, 0.9617919921875, 1.10504150390625, 1.248291015625, 1.39154052734375, 1.5347900390625, 1.67803955078125, 1.8212890625, 1.96453857421875, 2.1077880859375, 2.25103759765625, 2.394287109375, 2.53753662109375, 2.6807861328125, 2.82403564453125, 2.96728515625, 3.11053466796875, 3.2537841796875, 3.39703369140625, 3.540283203125, 3.68353271484375, 3.8267822265625, 3.97003173828125, 4.11328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 10.0, 15.0, 19.0, 59.0, 74.0, 135.0, 184.0, 333.0, 512.0, 909.0, 1331.0, 2290.0, 3638.0, 5870.0, 9420.0, 15302.0, 24481.0, 38759.0, 62394.0, 95587.0, 135797.0, 1212029.0, 157605.0, 117736.0, 78735.0, 50538.0, 31765.0, 19473.0, 12232.0, 7448.0, 4716.0, 2938.0, 1830.0, 1152.0, 681.0, 444.0, 249.0, 170.0, 97.0, 60.0, 37.0, 23.0, 15.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4797706604003906, -0.46417999267578125, -0.4485893249511719, -0.4329986572265625, -0.4174079895019531, -0.40181732177734375, -0.3862266540527344, -0.370635986328125, -0.3550453186035156, -0.33945465087890625, -0.3238639831542969, -0.3082733154296875, -0.2926826477050781, -0.27709197998046875, -0.2615013122558594, -0.24591064453125, -0.23031997680664062, -0.21472930908203125, -0.19913864135742188, -0.1835479736328125, -0.16795730590820312, -0.15236663818359375, -0.13677597045898438, -0.121185302734375, -0.10559463500976562, -0.09000396728515625, -0.07441329956054688, -0.0588226318359375, -0.043231964111328125, -0.02764129638671875, -0.012050628662109375, 0.0035400390625, 0.019130706787109375, 0.03472137451171875, 0.050312042236328125, 0.0659027099609375, 0.08149337768554688, 0.09708404541015625, 0.11267471313476562, 0.128265380859375, 0.14385604858398438, 0.15944671630859375, 0.17503738403320312, 0.1906280517578125, 0.20621871948242188, 0.22180938720703125, 0.23740005493164062, 0.25299072265625, 0.2685813903808594, 0.28417205810546875, 0.2997627258300781, 0.3153533935546875, 0.3309440612792969, 0.34653472900390625, 0.3621253967285156, 0.377716064453125, 0.3933067321777344, 0.40889739990234375, 0.4244880676269531, 0.4400787353515625, 0.4556694030761719, 0.47126007080078125, 0.4868507385253906, 0.50244140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 2.0, 13.0, 13.0, 19.0, 21.0, 19.0, 20.0, 34.0, 48.0, 64.0, 69.0, 85.0, 78.0, 95.0, 67.0, 83.0, 40.0, 47.0, 38.0, 20.0, 23.0, 16.0, 11.0, 13.0, 11.0, 4.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004192352294921875, -0.0040648579597473145, -0.003937363624572754, -0.0038098692893981934, -0.003682374954223633, -0.0035548806190490723, -0.0034273862838745117, -0.003299891948699951, -0.0031723976135253906, -0.00304490327835083, -0.0029174089431762695, -0.002789914608001709, -0.0026624202728271484, -0.002534925937652588, -0.0024074316024780273, -0.002279937267303467, -0.0021524429321289062, -0.0020249485969543457, -0.0018974542617797852, -0.0017699599266052246, -0.001642465591430664, -0.0015149712562561035, -0.001387476921081543, -0.0012599825859069824, -0.0011324882507324219, -0.0010049939155578613, -0.0008774995803833008, -0.0007500052452087402, -0.0006225109100341797, -0.0004950165748596191, -0.0003675222396850586, -0.00024002790451049805, -0.0001125335693359375, 1.4960765838623047e-05, 0.0001424551010131836, 0.00026994943618774414, 0.0003974437713623047, 0.0005249381065368652, 0.0006524324417114258, 0.0007799267768859863, 0.0009074211120605469, 0.0010349154472351074, 0.001162409782409668, 0.0012899041175842285, 0.001417398452758789, 0.0015448927879333496, 0.0016723871231079102, 0.0017998814582824707, 0.0019273757934570312, 0.002054870128631592, 0.0021823644638061523, 0.002309858798980713, 0.0024373531341552734, 0.002564847469329834, 0.0026923418045043945, 0.002819836139678955, 0.0029473304748535156, 0.003074824810028076, 0.0032023191452026367, 0.0033298134803771973, 0.003457307815551758, 0.0035848021507263184, 0.003712296485900879, 0.0038397908210754395, 0.00396728515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 6.0, 11.0, 11.0, 17.0, 21.0, 27.0, 32.0, 45.0, 63.0, 90.0, 135.0, 251.0, 993.0, 70357.0, 972484.0, 3038.0, 363.0, 203.0, 121.0, 76.0, 41.0, 32.0, 26.0, 24.0, 12.0, 14.0, 15.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083740234375, -0.08087348937988281, -0.07800674438476562, -0.07513999938964844, -0.07227325439453125, -0.06940650939941406, -0.06653976440429688, -0.06367301940917969, -0.0608062744140625, -0.05793952941894531, -0.055072784423828125, -0.05220603942871094, -0.04933929443359375, -0.04647254943847656, -0.043605804443359375, -0.04073905944824219, -0.037872314453125, -0.03500556945800781, -0.032138824462890625, -0.029272079467773438, -0.02640533447265625, -0.023538589477539062, -0.020671844482421875, -0.017805099487304688, -0.0149383544921875, -0.012071609497070312, -0.009204864501953125, -0.0063381195068359375, -0.00347137451171875, -0.0006046295166015625, 0.002262115478515625, 0.0051288604736328125, 0.00799560546875, 0.010862350463867188, 0.013729095458984375, 0.016595840454101562, 0.01946258544921875, 0.022329330444335938, 0.025196075439453125, 0.028062820434570312, 0.0309295654296875, 0.03379631042480469, 0.036663055419921875, 0.03952980041503906, 0.04239654541015625, 0.04526329040527344, 0.048130035400390625, 0.05099678039550781, 0.053863525390625, 0.05673027038574219, 0.059597015380859375, 0.06246376037597656, 0.06533050537109375, 0.06819725036621094, 0.07106399536132812, 0.07393074035644531, 0.0767974853515625, 0.07966423034667969, 0.08253097534179688, 0.08539772033691406, 0.08826446533203125, 0.09113121032714844, 0.09399795532226562, 0.09686470031738281, 0.0997314453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 10.0, 15.0, 29.0, 61.0, 104.0, 203.0, 230.0, 169.0, 85.0, 50.0, 28.0, 15.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018103704787790775, -0.0016513746231794357, -0.0014923788839951158, -0.0013333831448107958, -0.001174387289211154, -0.0010153914336115122, -0.0008563956944271922, -0.0006973999552428722, -0.0005384040996432304, -0.00037940830225124955, -0.00022041250485926867, -6.141670746728778e-05, 9.757908992469311e-05, 0.000256574887316674, 0.0004155706847086549, 0.0005745664238929749, 0.0007335622794926167, 0.0008925580768845975, 0.0010515538742765784, 0.0012105496134608984, 0.0013695454690605402, 0.001528541324660182, 0.001687537063844502, 0.001846532803028822, 0.0020055286586284637, 0.0021645245142281055, 0.0023235203698277473, 0.0024825159925967455, 0.0026415118481963873, 0.002800507703796029, 0.0029595033265650272, 0.003118499182164669, 0.003277495503425598, 0.00343649135902524, 0.0035954872146248817, 0.00375448283739388, 0.003913478925824165, 0.00407247431576252, 0.004231470171362162, 0.0043904660269618034, 0.004549461882561445, 0.004708457738161087, 0.004867453593760729, 0.005026449449360371, 0.005185444839298725, 0.005344440694898367, 0.005503436550498009, 0.0056624324060976505, 0.005821428261697292, 0.005980424117296934, 0.006139419972896576, 0.006298415828496218, 0.0064574116840958595, 0.006616407074034214, 0.006775402929633856, 0.006934398785233498, 0.007093394640833139, 0.007252390496432781, 0.007411386352032423, 0.007570382207632065, 0.007729377597570419, 0.007888373918831348, 0.008047369308769703, 0.008206365630030632, 0.008365361019968987]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 11.0, 12.0, 12.0, 13.0, 22.0, 35.0, 36.0, 24.0, 38.0, 42.0, 23.0, 43.0, 46.0, 43.0, 35.0, 41.0, 40.0, 29.0, 46.0, 31.0, 37.0, 34.0, 35.0, 30.0, 30.0, 34.0, 28.0, 15.0, 19.0, 9.0, 19.0, 14.0, 9.0, 4.0, 9.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0019698143005371094, -0.0019105495885014534, -0.0018512848764657974, -0.0017920201644301414, -0.0017327554523944855, -0.0016734907403588295, -0.0016142260283231735, -0.0015549613162875175, -0.0014956966042518616, -0.0014364318922162056, -0.0013771671801805496, -0.0013179024681448936, -0.0012586377561092377, -0.0011993730440735817, -0.0011401083320379257, -0.0010808436200022697, -0.0010215789079666138, -0.0009623141959309578, -0.0009030494838953018, -0.0008437847718596458, -0.0007845200598239899, -0.0007252553477883339, -0.0006659906357526779, -0.0006067259237170219, -0.000547461211681366, -0.00048819649964571, -0.000428931787610054, -0.00036966707557439804, -0.00031040236353874207, -0.0002511376515030861, -0.00019187293946743011, -0.00013260822743177414, -7.334351539611816e-05, -1.4078803360462189e-05, 4.518590867519379e-05, 0.00010445062071084976, 0.00016371533274650574, 0.0002229800447821617, 0.0002822447568178177, 0.00034150946885347366, 0.00040077418088912964, 0.0004600388929247856, 0.0005193036049604416, 0.0005785683169960976, 0.0006378330290317535, 0.0006970977410674095, 0.0007563624531030655, 0.0008156271651387215, 0.0008748918771743774, 0.0009341565892100334, 0.0009934213012456894, 0.0010526860132813454, 0.0011119507253170013, 0.0011712154373526573, 0.0012304801493883133, 0.0012897448614239693, 0.0013490095734596252, 0.0014082742854952812, 0.0014675389975309372, 0.0015268037095665932, 0.0015860684216022491, 0.0016453331336379051, 0.001704597845673561, 0.001763862557709217, 0.001823127269744873]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 45.0, 48.0, 38.0, 28.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 13.0, 20.0, 21.0, 31.0, 38.0, 72.0, 113.0, 203.0, 313.0, 485.0, 798.0, 1393.0, 2177.0, 3882.0, 7034.0, 13261.0, 28969.0, 74106.0, 223881.0, 434586.0, 155868.0, 54069.0, 22348.0, 10878.0, 5764.0, 3230.0, 1928.0, 1196.0, 664.0, 444.0, 250.0, 193.0, 109.0, 63.0, 43.0, 32.0, 22.0, 12.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -4.9930419921875, -4.833740234375, -4.6744384765625, -4.51513671875, -4.3558349609375, -4.196533203125, -4.0372314453125, -3.8779296875, -3.7186279296875, -3.559326171875, -3.4000244140625, -3.24072265625, -3.0814208984375, -2.922119140625, -2.7628173828125, -2.603515625, -2.4442138671875, -2.284912109375, -2.1256103515625, -1.96630859375, -1.8070068359375, -1.647705078125, -1.4884033203125, -1.3291015625, -1.1697998046875, -1.010498046875, -0.8511962890625, -0.69189453125, -0.5325927734375, -0.373291015625, -0.2139892578125, -0.0546875, 0.1046142578125, 0.263916015625, 0.4232177734375, 0.58251953125, 0.7418212890625, 0.901123046875, 1.0604248046875, 1.2197265625, 1.3790283203125, 1.538330078125, 1.6976318359375, 1.85693359375, 2.0162353515625, 2.175537109375, 2.3348388671875, 2.494140625, 2.6534423828125, 2.812744140625, 2.9720458984375, 3.13134765625, 3.2906494140625, 3.449951171875, 3.6092529296875, 3.7685546875, 3.9278564453125, 4.087158203125, 4.2464599609375, 4.40576171875, 4.5650634765625, 4.724365234375, 4.8836669921875, 5.04296875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 15.0, 19.0, 12.0, 14.0, 19.0, 25.0, 30.0, 38.0, 32.0, 41.0, 51.0, 52.0, 73.0, 97.0, 286.0, 1617.0, 145.0, 66.0, 58.0, 58.0, 35.0, 35.0, 28.0, 30.0, 28.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.80908203125, -21.0869140625, -20.36474609375, -19.642578125, -18.92041015625, -18.1982421875, -17.47607421875, -16.75390625, -16.03173828125, -15.3095703125, -14.58740234375, -13.865234375, -13.14306640625, -12.4208984375, -11.69873046875, -10.9765625, -10.25439453125, -9.5322265625, -8.81005859375, -8.087890625, -7.36572265625, -6.6435546875, -5.92138671875, -5.19921875, -4.47705078125, -3.7548828125, -3.03271484375, -2.310546875, -1.58837890625, -0.8662109375, -0.14404296875, 0.578125, 1.30029296875, 2.0224609375, 2.74462890625, 3.466796875, 4.18896484375, 4.9111328125, 5.63330078125, 6.35546875, 7.07763671875, 7.7998046875, 8.52197265625, 9.244140625, 9.96630859375, 10.6884765625, 11.41064453125, 12.1328125, 12.85498046875, 13.5771484375, 14.29931640625, 15.021484375, 15.74365234375, 16.4658203125, 17.18798828125, 17.91015625, 18.63232421875, 19.3544921875, 20.07666015625, 20.798828125, 21.52099609375, 22.2431640625, 22.96533203125, 23.6875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 5.0, 3.0, 7.0, 12.0, 7.0, 12.0, 18.0, 19.0, 23.0, 22.0, 32.0, 39.0, 61.0, 74.0, 120.0, 133.0, 212.0, 301.0, 560.0, 3099.0, 855099.0, 2280285.0, 3778.0, 567.0, 329.0, 222.0, 148.0, 132.0, 91.0, 57.0, 39.0, 35.0, 38.0, 22.0, 29.0, 16.0, 16.0, 7.0, 12.0, 3.0, 3.0, 6.0, 2.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.40625, -54.69873046875, -52.9912109375, -51.28369140625, -49.576171875, -47.86865234375, -46.1611328125, -44.45361328125, -42.74609375, -41.03857421875, -39.3310546875, -37.62353515625, -35.916015625, -34.20849609375, -32.5009765625, -30.79345703125, -29.0859375, -27.37841796875, -25.6708984375, -23.96337890625, -22.255859375, -20.54833984375, -18.8408203125, -17.13330078125, -15.42578125, -13.71826171875, -12.0107421875, -10.30322265625, -8.595703125, -6.88818359375, -5.1806640625, -3.47314453125, -1.765625, -0.05810546875, 1.6494140625, 3.35693359375, 5.064453125, 6.77197265625, 8.4794921875, 10.18701171875, 11.89453125, 13.60205078125, 15.3095703125, 17.01708984375, 18.724609375, 20.43212890625, 22.1396484375, 23.84716796875, 25.5546875, 27.26220703125, 28.9697265625, 30.67724609375, 32.384765625, 34.09228515625, 35.7998046875, 37.50732421875, 39.21484375, 40.92236328125, 42.6298828125, 44.33740234375, 46.044921875, 47.75244140625, 49.4599609375, 51.16748046875, 52.875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 153.0, 806.0, 55.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.01434326171875, -22.866750717163086, -17.719158172607422, -12.571565628051758, -7.423973083496094, -2.2763805389404297, 2.8712120056152344, 8.018806457519531, 13.166397094726562, 18.313989639282227, 23.46158218383789, 28.609174728393555, 33.75676727294922, 38.90435791015625, 44.05195236206055, 49.199546813964844, 54.347137451171875, 59.494728088378906, 64.64231872558594, 69.7899169921875, 74.93750762939453, 80.08509826660156, 85.23269653320312, 90.38028717041016, 95.52787780761719, 100.67546844482422, 105.82305908203125, 110.97065734863281, 116.11824798583984, 121.26583862304688, 126.41343688964844, 131.56103515625, 136.7086181640625, 141.85621643066406, 147.00379943847656, 152.15139770507812, 157.29898071289062, 162.4465789794922, 167.59417724609375, 172.74176025390625, 177.8893585205078, 183.03695678710938, 188.18453979492188, 193.33213806152344, 198.479736328125, 203.6273193359375, 208.77491760253906, 213.92251586914062, 219.07009887695312, 224.2176971435547, 229.3652801513672, 234.51287841796875, 239.66046142578125, 244.8080596923828, 249.95565795898438, 255.10324096679688, 260.2508544921875, 265.3984375, 270.5460510253906, 275.6936340332031, 280.8412170410156, 285.98883056640625, 291.13641357421875, 296.28399658203125, 301.43157958984375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 5.0, 9.0, 12.0, 18.0, 9.0, 18.0, 14.0, 27.0, 23.0, 24.0, 29.0, 29.0, 32.0, 29.0, 42.0, 33.0, 36.0, 42.0, 39.0, 46.0, 41.0, 32.0, 33.0, 42.0, 29.0, 37.0, 28.0, 24.0, 23.0, 22.0, 16.0, 12.0, 12.0, 12.0, 11.0, 12.0, 8.0, 8.0, 9.0, 3.0, 7.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-43.49616241455078, -42.049827575683594, -40.603492736816406, -39.15715789794922, -37.71082305908203, -36.26448440551758, -34.81814956665039, -33.3718147277832, -31.925479888916016, -30.479145050048828, -29.03281021118164, -27.58647346496582, -26.140138626098633, -24.693803787231445, -23.247467041015625, -21.801132202148438, -20.35479736328125, -18.908462524414062, -17.462127685546875, -16.015790939331055, -14.569456100463867, -13.12312126159668, -11.676785469055176, -10.230449676513672, -8.784114837646484, -7.337779521942139, -5.891444206237793, -4.445108890533447, -2.9987735748291016, -1.5524382591247559, -0.10610294342041016, 1.3402328491210938, 2.7865676879882812, 4.232903003692627, 5.679238319396973, 7.125573635101318, 8.571908950805664, 10.018243789672852, 11.464579582214355, 12.91091537475586, 14.357250213623047, 15.803585052490234, 17.249919891357422, 18.696256637573242, 20.14259147644043, 21.588926315307617, 23.035263061523438, 24.481597900390625, 25.927932739257812, 27.374267578125, 28.820602416992188, 30.266939163208008, 31.713274002075195, 33.159610748291016, 34.6059455871582, 36.05228042602539, 37.49861526489258, 38.944950103759766, 40.39128494262695, 41.83761978149414, 43.283958435058594, 44.73029327392578, 46.17662811279297, 47.622962951660156, 49.069297790527344]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 13.0, 5.0, 10.0, 10.0, 15.0, 18.0, 16.0, 17.0, 29.0, 30.0, 22.0, 30.0, 35.0, 36.0, 32.0, 34.0, 34.0, 38.0, 47.0, 44.0, 45.0, 35.0, 33.0, 29.0, 44.0, 33.0, 28.0, 34.0, 27.0, 26.0, 16.0, 24.0, 17.0, 18.0, 12.0, 11.0, 11.0, 9.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.63201904296875, -5.4281005859375, -5.22418212890625, -5.020263671875, -4.81634521484375, -4.6124267578125, -4.40850830078125, -4.20458984375, -4.00067138671875, -3.7967529296875, -3.59283447265625, -3.388916015625, -3.18499755859375, -2.9810791015625, -2.77716064453125, -2.5732421875, -2.36932373046875, -2.1654052734375, -1.96148681640625, -1.757568359375, -1.55364990234375, -1.3497314453125, -1.14581298828125, -0.94189453125, -0.73797607421875, -0.5340576171875, -0.33013916015625, -0.126220703125, 0.07769775390625, 0.2816162109375, 0.48553466796875, 0.689453125, 0.89337158203125, 1.0972900390625, 1.30120849609375, 1.505126953125, 1.70904541015625, 1.9129638671875, 2.11688232421875, 2.32080078125, 2.52471923828125, 2.7286376953125, 2.93255615234375, 3.136474609375, 3.34039306640625, 3.5443115234375, 3.74822998046875, 3.9521484375, 4.15606689453125, 4.3599853515625, 4.56390380859375, 4.767822265625, 4.97174072265625, 5.1756591796875, 5.37957763671875, 5.58349609375, 5.78741455078125, 5.9913330078125, 6.19525146484375, 6.399169921875, 6.60308837890625, 6.8070068359375, 7.01092529296875, 7.21484375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 0.0, 5.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 12.0, 12.0, 33.0, 26.0, 32.0, 46.0, 56.0, 93.0, 205.0, 436.0, 1288.0, 4578.0, 27088.0, 519366.0, 3174116.0, 436548.0, 23766.0, 4187.0, 1221.0, 489.0, 215.0, 105.0, 59.0, 52.0, 37.0, 19.0, 28.0, 20.0, 17.0, 14.0, 14.0, 12.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.921875, -15.296875, -14.671875, -14.046875, -13.421875, -12.796875, -12.171875, -11.546875, -10.921875, -10.296875, -9.671875, -9.046875, -8.421875, -7.796875, -7.171875, -6.546875, -5.921875, -5.296875, -4.671875, -4.046875, -3.421875, -2.796875, -2.171875, -1.546875, -0.921875, -0.296875, 0.328125, 0.953125, 1.578125, 2.203125, 2.828125, 3.453125, 4.078125, 4.703125, 5.328125, 5.953125, 6.578125, 7.203125, 7.828125, 8.453125, 9.078125, 9.703125, 10.328125, 10.953125, 11.578125, 12.203125, 12.828125, 13.453125, 14.078125, 14.703125, 15.328125, 15.953125, 16.578125, 17.203125, 17.828125, 18.453125, 19.078125, 19.703125, 20.328125, 20.953125, 21.578125, 22.203125, 22.828125, 23.453125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 4.0, 11.0, 12.0, 9.0, 16.0, 13.0, 32.0, 35.0, 32.0, 39.0, 56.0, 86.0, 87.0, 115.0, 152.0, 187.0, 251.0, 333.0, 392.0, 407.0, 387.0, 323.0, 224.0, 202.0, 149.0, 114.0, 97.0, 52.0, 60.0, 35.0, 31.0, 22.0, 20.0, 14.0, 17.0, 10.0, 12.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.921875, -10.594482421875, -10.26708984375, -9.939697265625, -9.6123046875, -9.284912109375, -8.95751953125, -8.630126953125, -8.302734375, -7.975341796875, -7.64794921875, -7.320556640625, -6.9931640625, -6.665771484375, -6.33837890625, -6.010986328125, -5.68359375, -5.356201171875, -5.02880859375, -4.701416015625, -4.3740234375, -4.046630859375, -3.71923828125, -3.391845703125, -3.064453125, -2.737060546875, -2.40966796875, -2.082275390625, -1.7548828125, -1.427490234375, -1.10009765625, -0.772705078125, -0.4453125, -0.117919921875, 0.20947265625, 0.536865234375, 0.8642578125, 1.191650390625, 1.51904296875, 1.846435546875, 2.173828125, 2.501220703125, 2.82861328125, 3.156005859375, 3.4833984375, 3.810791015625, 4.13818359375, 4.465576171875, 4.79296875, 5.120361328125, 5.44775390625, 5.775146484375, 6.1025390625, 6.429931640625, 6.75732421875, 7.084716796875, 7.412109375, 7.739501953125, 8.06689453125, 8.394287109375, 8.7216796875, 9.049072265625, 9.37646484375, 9.703857421875, 10.03125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 9.0, 16.0, 15.0, 15.0, 19.0, 25.0, 31.0, 47.0, 58.0, 65.0, 78.0, 105.0, 125.0, 182.0, 219.0, 305.0, 402.0, 1587.0, 41038.0, 3824102.0, 319366.0, 4392.0, 592.0, 311.0, 219.0, 191.0, 159.0, 107.0, 98.0, 81.0, 65.0, 61.0, 39.0, 36.0, 32.0, 17.0, 21.0, 7.0, 11.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.84375, -47.30322265625, -45.7626953125, -44.22216796875, -42.681640625, -41.14111328125, -39.6005859375, -38.06005859375, -36.51953125, -34.97900390625, -33.4384765625, -31.89794921875, -30.357421875, -28.81689453125, -27.2763671875, -25.73583984375, -24.1953125, -22.65478515625, -21.1142578125, -19.57373046875, -18.033203125, -16.49267578125, -14.9521484375, -13.41162109375, -11.87109375, -10.33056640625, -8.7900390625, -7.24951171875, -5.708984375, -4.16845703125, -2.6279296875, -1.08740234375, 0.453125, 1.99365234375, 3.5341796875, 5.07470703125, 6.615234375, 8.15576171875, 9.6962890625, 11.23681640625, 12.77734375, 14.31787109375, 15.8583984375, 17.39892578125, 18.939453125, 20.47998046875, 22.0205078125, 23.56103515625, 25.1015625, 26.64208984375, 28.1826171875, 29.72314453125, 31.263671875, 32.80419921875, 34.3447265625, 35.88525390625, 37.42578125, 38.96630859375, 40.5068359375, 42.04736328125, 43.587890625, 45.12841796875, 46.6689453125, 48.20947265625, 49.75]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 12.0, 43.0, 81.0, 157.0, 204.0, 213.0, 153.0, 89.0, 36.0, 14.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.66555786132812, -93.73625183105469, -90.80694580078125, -87.87764739990234, -84.9483413696289, -82.01903533935547, -79.08973693847656, -76.16043090820312, -73.23112487792969, -70.30181884765625, -67.37251281738281, -64.4432144165039, -61.51390838623047, -58.58460235595703, -55.65530014038086, -52.72599792480469, -49.79669189453125, -46.86738586425781, -43.93808364868164, -41.00878143310547, -38.07947540283203, -35.150169372558594, -32.22086715698242, -29.291563034057617, -26.362258911132812, -23.432954788208008, -20.503650665283203, -17.5743465423584, -14.645042419433594, -11.715738296508789, -8.786434173583984, -5.85713005065918, -2.9278182983398438, 0.0014858245849609375, 2.9307899475097656, 5.86009407043457, 8.789398193359375, 11.71870231628418, 14.648006439208984, 17.57731056213379, 20.506614685058594, 23.4359188079834, 26.365222930908203, 29.294527053833008, 32.22383117675781, 35.15313720703125, 38.08243942260742, 41.011741638183594, 43.94104766845703, 46.87035369873047, 49.79965591430664, 52.72895812988281, 55.65826416015625, 58.58757019042969, 61.51687240600586, 64.44617462158203, 67.37548065185547, 70.3047866821289, 73.23408508300781, 76.16339111328125, 79.09269714355469, 82.02200317382812, 84.95130920410156, 87.88060760498047, 90.8099136352539]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 8.0, 6.0, 11.0, 16.0, 15.0, 20.0, 19.0, 29.0, 26.0, 33.0, 32.0, 35.0, 34.0, 43.0, 30.0, 43.0, 42.0, 30.0, 51.0, 29.0, 55.0, 36.0, 31.0, 34.0, 30.0, 31.0, 32.0, 22.0, 26.0, 19.0, 14.0, 21.0, 18.0, 17.0, 11.0, 12.0, 6.0, 3.0, 6.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.440338134765625, -39.168846130371094, -37.8973503112793, -36.625858306884766, -35.35436248779297, -34.08287048339844, -32.811378479003906, -31.539884567260742, -30.268390655517578, -28.996896743774414, -27.72540283203125, -26.45391082763672, -25.182416915893555, -23.91092300415039, -22.63943099975586, -21.367937088012695, -20.09644317626953, -18.824949264526367, -17.553455352783203, -16.281963348388672, -15.010469436645508, -13.738975524902344, -12.467482566833496, -11.195989608764648, -9.924495697021484, -8.65300178527832, -7.381508827209473, -6.110015392303467, -4.838521957397461, -3.567028522491455, -2.295535087585449, -1.0240421295166016, 0.2474517822265625, 1.5189452171325684, 2.790438652038574, 4.06193208694458, 5.333425521850586, 6.604918956756592, 7.876412391662598, 9.147905349731445, 10.41939926147461, 11.690893173217773, 12.962386131286621, 14.233879089355469, 15.505373001098633, 16.776866912841797, 18.048358917236328, 19.319852828979492, 20.591346740722656, 21.86284065246582, 23.134334564208984, 24.405826568603516, 25.67732048034668, 26.948814392089844, 28.220306396484375, 29.49180030822754, 30.763294219970703, 32.034786224365234, 33.30628204345703, 34.57777404785156, 35.849266052246094, 37.12076187133789, 38.39225387573242, 39.66374969482422, 40.93524169921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 33.0, 23.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 10.0, 22.0, 24.0, 52.0, 81.0, 118.0, 156.0, 279.0, 438.0, 682.0, 953.0, 1517.0, 2365.0, 3675.0, 5810.0, 9203.0, 14509.0, 23276.0, 37834.0, 61601.0, 98723.0, 147986.0, 184909.0, 159820.0, 111352.0, 69369.0, 42787.0, 26219.0, 16148.0, 10262.0, 6518.0, 4285.0, 2613.0, 1772.0, 1082.0, 724.0, 473.0, 305.0, 204.0, 138.0, 87.0, 53.0, 39.0, 21.0, 14.0, 16.0, 10.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.72900390625, -0.7085418701171875, -0.688079833984375, -0.6676177978515625, -0.64715576171875, -0.6266937255859375, -0.606231689453125, -0.5857696533203125, -0.5653076171875, -0.5448455810546875, -0.524383544921875, -0.5039215087890625, -0.48345947265625, -0.4629974365234375, -0.442535400390625, -0.4220733642578125, -0.401611328125, -0.3811492919921875, -0.360687255859375, -0.3402252197265625, -0.31976318359375, -0.2993011474609375, -0.278839111328125, -0.2583770751953125, -0.2379150390625, -0.2174530029296875, -0.196990966796875, -0.1765289306640625, -0.15606689453125, -0.1356048583984375, -0.115142822265625, -0.0946807861328125, -0.07421875, -0.0537567138671875, -0.033294677734375, -0.0128326416015625, 0.00762939453125, 0.0280914306640625, 0.048553466796875, 0.0690155029296875, 0.0894775390625, 0.1099395751953125, 0.130401611328125, 0.1508636474609375, 0.17132568359375, 0.1917877197265625, 0.212249755859375, 0.2327117919921875, 0.253173828125, 0.2736358642578125, 0.294097900390625, 0.3145599365234375, 0.33502197265625, 0.3554840087890625, 0.375946044921875, 0.3964080810546875, 0.4168701171875, 0.4373321533203125, 0.457794189453125, 0.4782562255859375, 0.49871826171875, 0.5191802978515625, 0.539642333984375, 0.5601043701171875, 0.58056640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 4.0, 6.0, 14.0, 15.0, 11.0, 11.0, 17.0, 23.0, 25.0, 26.0, 25.0, 22.0, 21.0, 33.0, 26.0, 39.0, 45.0, 40.0, 35.0, 27.0, 1084.0, 27.0, 33.0, 46.0, 34.0, 27.0, 28.0, 30.0, 19.0, 22.0, 24.0, 25.0, 27.0, 17.0, 15.0, 17.0, 11.0, 14.0, 13.0, 12.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4765625, -3.36114501953125, -3.2457275390625, -3.13031005859375, -3.014892578125, -2.89947509765625, -2.7840576171875, -2.66864013671875, -2.55322265625, -2.43780517578125, -2.3223876953125, -2.20697021484375, -2.091552734375, -1.97613525390625, -1.8607177734375, -1.74530029296875, -1.6298828125, -1.51446533203125, -1.3990478515625, -1.28363037109375, -1.168212890625, -1.05279541015625, -0.9373779296875, -0.82196044921875, -0.70654296875, -0.59112548828125, -0.4757080078125, -0.36029052734375, -0.244873046875, -0.12945556640625, -0.0140380859375, 0.10137939453125, 0.216796875, 0.33221435546875, 0.4476318359375, 0.56304931640625, 0.678466796875, 0.79388427734375, 0.9093017578125, 1.02471923828125, 1.14013671875, 1.25555419921875, 1.3709716796875, 1.48638916015625, 1.601806640625, 1.71722412109375, 1.8326416015625, 1.94805908203125, 2.0634765625, 2.17889404296875, 2.2943115234375, 2.40972900390625, 2.525146484375, 2.64056396484375, 2.7559814453125, 2.87139892578125, 2.98681640625, 3.10223388671875, 3.2176513671875, 3.33306884765625, 3.448486328125, 3.56390380859375, 3.6793212890625, 3.79473876953125, 3.91015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 16.0, 27.0, 31.0, 53.0, 110.0, 177.0, 299.0, 533.0, 946.0, 1620.0, 2911.0, 4782.0, 8338.0, 13508.0, 22538.0, 37024.0, 60519.0, 97000.0, 143703.0, 1224228.0, 164383.0, 118833.0, 76963.0, 47148.0, 28668.0, 17491.0, 10565.0, 6140.0, 3560.0, 2031.0, 1282.0, 699.0, 411.0, 214.0, 161.0, 92.0, 31.0, 32.0, 17.0, 19.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5201873779296875, -0.503265380859375, -0.4863433837890625, -0.46942138671875, -0.4524993896484375, -0.435577392578125, -0.4186553955078125, -0.4017333984375, -0.3848114013671875, -0.367889404296875, -0.3509674072265625, -0.33404541015625, -0.3171234130859375, -0.300201416015625, -0.2832794189453125, -0.266357421875, -0.2494354248046875, -0.232513427734375, -0.2155914306640625, -0.19866943359375, -0.1817474365234375, -0.164825439453125, -0.1479034423828125, -0.1309814453125, -0.1140594482421875, -0.097137451171875, -0.0802154541015625, -0.06329345703125, -0.0463714599609375, -0.029449462890625, -0.0125274658203125, 0.00439453125, 0.0213165283203125, 0.038238525390625, 0.0551605224609375, 0.07208251953125, 0.0890045166015625, 0.105926513671875, 0.1228485107421875, 0.1397705078125, 0.1566925048828125, 0.173614501953125, 0.1905364990234375, 0.20745849609375, 0.2243804931640625, 0.241302490234375, 0.2582244873046875, 0.275146484375, 0.2920684814453125, 0.308990478515625, 0.3259124755859375, 0.34283447265625, 0.3597564697265625, 0.376678466796875, 0.3936004638671875, 0.4105224609375, 0.4274444580078125, 0.444366455078125, 0.4612884521484375, 0.47821044921875, 0.4951324462890625, 0.512054443359375, 0.5289764404296875, 0.5458984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 5.0, 9.0, 7.0, 13.0, 17.0, 21.0, 15.0, 20.0, 25.0, 43.0, 53.0, 67.0, 56.0, 68.0, 75.0, 66.0, 61.0, 62.0, 60.0, 34.0, 28.0, 31.0, 21.0, 24.0, 15.0, 16.0, 16.0, 9.0, 16.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.003993988037109375, -0.0038833022117614746, -0.0037726163864135742, -0.003661930561065674, -0.0035512447357177734, -0.003440558910369873, -0.0033298730850219727, -0.0032191872596740723, -0.003108501434326172, -0.0029978156089782715, -0.002887129783630371, -0.0027764439582824707, -0.0026657581329345703, -0.00255507230758667, -0.0024443864822387695, -0.002333700656890869, -0.0022230148315429688, -0.0021123290061950684, -0.002001643180847168, -0.0018909573554992676, -0.0017802715301513672, -0.0016695857048034668, -0.0015588998794555664, -0.001448214054107666, -0.0013375282287597656, -0.0012268424034118652, -0.0011161565780639648, -0.0010054707527160645, -0.0008947849273681641, -0.0007840991020202637, -0.0006734132766723633, -0.0005627274513244629, -0.0004520416259765625, -0.0003413558006286621, -0.00023066997528076172, -0.00011998414993286133, -9.298324584960938e-06, 0.00010138750076293945, 0.00021207332611083984, 0.00032275915145874023, 0.0004334449768066406, 0.000544130802154541, 0.0006548166275024414, 0.0007655024528503418, 0.0008761882781982422, 0.0009868741035461426, 0.001097559928894043, 0.0012082457542419434, 0.0013189315795898438, 0.0014296174049377441, 0.0015403032302856445, 0.001650989055633545, 0.0017616748809814453, 0.0018723607063293457, 0.001983046531677246, 0.0020937323570251465, 0.002204418182373047, 0.0023151040077209473, 0.0024257898330688477, 0.002536475658416748, 0.0026471614837646484, 0.002757847309112549, 0.0028685331344604492, 0.0029792189598083496, 0.00308990478515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 16.0, 16.0, 14.0, 21.0, 28.0, 46.0, 40.0, 68.0, 80.0, 107.0, 238.0, 1016.0, 47103.0, 990464.0, 8096.0, 524.0, 197.0, 116.0, 96.0, 51.0, 43.0, 24.0, 27.0, 12.0, 17.0, 14.0, 12.0, 6.0, 7.0, 8.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06951904296875, -0.0668783187866211, -0.06423759460449219, -0.06159687042236328, -0.058956146240234375, -0.05631542205810547, -0.05367469787597656, -0.051033973693847656, -0.04839324951171875, -0.045752525329589844, -0.04311180114746094, -0.04047107696533203, -0.037830352783203125, -0.03518962860107422, -0.03254890441894531, -0.029908180236816406, -0.0272674560546875, -0.024626731872558594, -0.021986007690429688, -0.01934528350830078, -0.016704559326171875, -0.014063835144042969, -0.011423110961914062, -0.008782386779785156, -0.00614166259765625, -0.0035009384155273438, -0.0008602142333984375, 0.0017805099487304688, 0.004421234130859375, 0.007061958312988281, 0.009702682495117188, 0.012343406677246094, 0.014984130859375, 0.017624855041503906, 0.020265579223632812, 0.02290630340576172, 0.025547027587890625, 0.02818775177001953, 0.030828475952148438, 0.033469200134277344, 0.03610992431640625, 0.038750648498535156, 0.04139137268066406, 0.04403209686279297, 0.046672821044921875, 0.04931354522705078, 0.05195426940917969, 0.054594993591308594, 0.0572357177734375, 0.059876441955566406, 0.06251716613769531, 0.06515789031982422, 0.06779861450195312, 0.07043933868408203, 0.07308006286621094, 0.07572078704833984, 0.07836151123046875, 0.08100223541259766, 0.08364295959472656, 0.08628368377685547, 0.08892440795898438, 0.09156513214111328, 0.09420585632324219, 0.0968465805053711, 0.0994873046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 38.0, 518.0, 418.0, 34.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002878597006201744, -0.0021503595635294914, -0.0014221223536878824, -0.0006938851438462734, 3.435229882597923e-05, 0.0007625897414982319, 0.0014908267185091972, 0.00221906416118145, 0.0029473016038537025, 0.003675539046525955, 0.004403776489198208, 0.005132013466209173, 0.005860250908881426, 0.0065884883515536785, 0.007316725328564644, 0.008044962771236897, 0.00877320021390915, 0.009501437656581402, 0.010229675099253654, 0.010957911610603333, 0.01168614998459816, 0.012414386495947838, 0.01314262393862009, 0.013870861381292343, 0.014599098823964596, 0.015327336266636848, 0.016055572777986526, 0.016783811151981354, 0.017512047663331032, 0.01824028603732586, 0.018968522548675537, 0.019696760922670364, 0.02042499929666519, 0.02115323580801487, 0.021881474182009697, 0.022609710693359375, 0.023337949067354202, 0.02406618557870388, 0.02479442209005356, 0.025522660464048386, 0.026250898838043213, 0.02697913534939289, 0.027707373723387718, 0.028435610234737396, 0.029163848608732224, 0.0298920851200819, 0.03062032163143158, 0.03134856000542641, 0.032076798379421234, 0.03280503675341606, 0.03353327140212059, 0.03426150977611542, 0.034989748150110245, 0.03571798652410507, 0.0364462211728096, 0.03717445954680443, 0.03790269419550896, 0.038630932569503784, 0.03935916721820831, 0.04008740559220314, 0.04081564396619797, 0.041543882340192795, 0.042272116988897324, 0.04300035536289215, 0.04372859373688698]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 16.0, 15.0, 26.0, 28.0, 33.0, 37.0, 39.0, 56.0, 63.0, 63.0, 62.0, 61.0, 76.0, 70.0, 67.0, 42.0, 45.0, 57.0, 26.0, 19.0, 21.0, 15.0, 17.0, 9.0, 8.0, 8.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00315779447555542, -0.0030496595427393913, -0.0029415246099233627, -0.002833389677107334, -0.0027252547442913055, -0.002617119811475277, -0.0025089848786592484, -0.0024008499458432198, -0.002292715013027191, -0.0021845800802111626, -0.002076445147395134, -0.0019683102145791054, -0.0018601752817630768, -0.0017520403489470482, -0.0016439054161310196, -0.001535770483314991, -0.0014276355504989624, -0.0013195006176829338, -0.0012113656848669052, -0.0011032307520508766, -0.000995095819234848, -0.0008869608864188194, -0.0007788259536027908, -0.0006706910207867622, -0.0005625560879707336, -0.00045442115515470505, -0.00034628622233867645, -0.00023815128952264786, -0.00013001635670661926, -2.1881423890590668e-05, 8.625350892543793e-05, 0.00019438844174146652, 0.0003025233745574951, 0.0004106583073735237, 0.0005187932401895523, 0.0006269281730055809, 0.0007350631058216095, 0.0008431980386376381, 0.0009513329714536667, 0.0010594679042696953, 0.0011676028370857239, 0.0012757377699017525, 0.001383872702717781, 0.0014920076355338097, 0.0016001425683498383, 0.0017082775011658669, 0.0018164124339818954, 0.001924547366797924, 0.0020326822996139526, 0.0021408172324299812, 0.00224895216524601, 0.0023570870980620384, 0.002465222030878067, 0.0025733569636940956, 0.002681491896510124, 0.002789626829326153, 0.0028977617621421814, 0.00300589669495821, 0.0031140316277742386, 0.003222166560590267, 0.0033303014934062958, 0.0034384364262223244, 0.003546571359038353, 0.0036547062918543816, 0.00376284122467041]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 32.0, 24.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 18.0, 23.0, 34.0, 32.0, 53.0, 57.0, 81.0, 125.0, 171.0, 283.0, 430.0, 882.0, 1753.0, 3752.0, 8442.0, 20365.0, 53640.0, 156912.0, 488872.0, 202755.0, 65841.0, 24978.0, 10138.0, 4431.0, 2025.0, 934.0, 495.0, 320.0, 203.0, 132.0, 81.0, 57.0, 50.0, 40.0, 29.0, 27.0, 17.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.208251953125, -5.99853515625, -5.788818359375, -5.5791015625, -5.369384765625, -5.15966796875, -4.949951171875, -4.740234375, -4.530517578125, -4.32080078125, -4.111083984375, -3.9013671875, -3.691650390625, -3.48193359375, -3.272216796875, -3.0625, -2.852783203125, -2.64306640625, -2.433349609375, -2.2236328125, -2.013916015625, -1.80419921875, -1.594482421875, -1.384765625, -1.175048828125, -0.96533203125, -0.755615234375, -0.5458984375, -0.336181640625, -0.12646484375, 0.083251953125, 0.29296875, 0.502685546875, 0.71240234375, 0.922119140625, 1.1318359375, 1.341552734375, 1.55126953125, 1.760986328125, 1.970703125, 2.180419921875, 2.39013671875, 2.599853515625, 2.8095703125, 3.019287109375, 3.22900390625, 3.438720703125, 3.6484375, 3.858154296875, 4.06787109375, 4.277587890625, 4.4873046875, 4.697021484375, 4.90673828125, 5.116455078125, 5.326171875, 5.535888671875, 5.74560546875, 5.955322265625, 6.1650390625, 6.374755859375, 6.58447265625, 6.794189453125, 7.00390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 10.0, 10.0, 7.0, 7.0, 6.0, 8.0, 15.0, 16.0, 19.0, 14.0, 33.0, 30.0, 30.0, 31.0, 39.0, 34.0, 56.0, 50.0, 109.0, 384.0, 1582.0, 110.0, 59.0, 55.0, 42.0, 36.0, 42.0, 25.0, 23.0, 24.0, 16.0, 14.0, 13.0, 25.0, 14.0, 13.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.22216796875, -17.6162109375, -17.01025390625, -16.404296875, -15.79833984375, -15.1923828125, -14.58642578125, -13.98046875, -13.37451171875, -12.7685546875, -12.16259765625, -11.556640625, -10.95068359375, -10.3447265625, -9.73876953125, -9.1328125, -8.52685546875, -7.9208984375, -7.31494140625, -6.708984375, -6.10302734375, -5.4970703125, -4.89111328125, -4.28515625, -3.67919921875, -3.0732421875, -2.46728515625, -1.861328125, -1.25537109375, -0.6494140625, -0.04345703125, 0.5625, 1.16845703125, 1.7744140625, 2.38037109375, 2.986328125, 3.59228515625, 4.1982421875, 4.80419921875, 5.41015625, 6.01611328125, 6.6220703125, 7.22802734375, 7.833984375, 8.43994140625, 9.0458984375, 9.65185546875, 10.2578125, 10.86376953125, 11.4697265625, 12.07568359375, 12.681640625, 13.28759765625, 13.8935546875, 14.49951171875, 15.10546875, 15.71142578125, 16.3173828125, 16.92333984375, 17.529296875, 18.13525390625, 18.7412109375, 19.34716796875, 19.953125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 8.0, 7.0, 16.0, 11.0, 17.0, 19.0, 26.0, 31.0, 30.0, 35.0, 45.0, 72.0, 90.0, 143.0, 218.0, 326.0, 663.0, 1176.0, 6112.0, 2706212.0, 424309.0, 3461.0, 1071.0, 562.0, 300.0, 182.0, 141.0, 87.0, 68.0, 35.0, 42.0, 42.0, 24.0, 8.0, 23.0, 22.0, 13.0, 10.0, 4.0, 8.0, 8.0, 4.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-45.71875, -44.28564453125, -42.8525390625, -41.41943359375, -39.986328125, -38.55322265625, -37.1201171875, -35.68701171875, -34.25390625, -32.82080078125, -31.3876953125, -29.95458984375, -28.521484375, -27.08837890625, -25.6552734375, -24.22216796875, -22.7890625, -21.35595703125, -19.9228515625, -18.48974609375, -17.056640625, -15.62353515625, -14.1904296875, -12.75732421875, -11.32421875, -9.89111328125, -8.4580078125, -7.02490234375, -5.591796875, -4.15869140625, -2.7255859375, -1.29248046875, 0.140625, 1.57373046875, 3.0068359375, 4.43994140625, 5.873046875, 7.30615234375, 8.7392578125, 10.17236328125, 11.60546875, 13.03857421875, 14.4716796875, 15.90478515625, 17.337890625, 18.77099609375, 20.2041015625, 21.63720703125, 23.0703125, 24.50341796875, 25.9365234375, 27.36962890625, 28.802734375, 30.23583984375, 31.6689453125, 33.10205078125, 34.53515625, 35.96826171875, 37.4013671875, 38.83447265625, 40.267578125, 41.70068359375, 43.1337890625, 44.56689453125, 46.0]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 22.0, 42.0, 62.0, 84.0, 107.0, 155.0, 175.0, 126.0, 85.0, 69.0, 38.0, 20.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.023704528808594, -35.27062225341797, -34.51754379272461, -33.764461517333984, -33.011383056640625, -32.25830078125, -31.505218505859375, -30.752138137817383, -29.99905776977539, -29.2459774017334, -28.492897033691406, -27.73981475830078, -26.98673439025879, -26.233654022216797, -25.480571746826172, -24.72749137878418, -23.974411010742188, -23.221330642700195, -22.468250274658203, -21.715167999267578, -20.962087631225586, -20.209007263183594, -19.45592498779297, -18.702844619750977, -17.949764251708984, -17.196683883666992, -16.443603515625, -15.690521240234375, -14.937440872192383, -14.18436050415039, -13.431279182434082, -12.678197860717773, -11.925118446350098, -11.172037124633789, -10.418956756591797, -9.665876388549805, -8.912795066833496, -8.159713745117188, -7.406633377075195, -6.653552532196045, -5.9004716873168945, -5.147390842437744, -4.394309997558594, -3.6412291526794434, -2.888148307800293, -2.1350674629211426, -1.3819866180419922, -0.6289057731628418, 0.1241750717163086, 0.877255916595459, 1.6303367614746094, 2.3834176063537598, 3.13649845123291, 3.8895792961120605, 4.642660140991211, 5.395740985870361, 6.148821830749512, 6.901902675628662, 7.6549835205078125, 8.408063888549805, 9.161145210266113, 9.914226531982422, 10.667306900024414, 11.420387268066406, 12.173468589782715]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 5.0, 15.0, 9.0, 11.0, 18.0, 14.0, 10.0, 11.0, 23.0, 19.0, 19.0, 29.0, 21.0, 24.0, 42.0, 29.0, 32.0, 45.0, 43.0, 33.0, 31.0, 36.0, 34.0, 38.0, 30.0, 40.0, 33.0, 36.0, 26.0, 26.0, 23.0, 17.0, 17.0, 18.0, 20.0, 14.0, 22.0, 15.0, 16.0, 11.0, 6.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-46.38966751098633, -44.90962600708008, -43.42958450317383, -41.94954299926758, -40.46950149536133, -38.98945999145508, -37.50941848754883, -36.02937698364258, -34.54933547973633, -33.06929397583008, -31.589252471923828, -30.109210968017578, -28.629169464111328, -27.149127960205078, -25.669086456298828, -24.189044952392578, -22.709001541137695, -21.228960037231445, -19.748918533325195, -18.268877029418945, -16.788835525512695, -15.308794021606445, -13.828751564025879, -12.348710060119629, -10.868668556213379, -9.388627052307129, -7.908585548400879, -6.428543567657471, -4.948502063751221, -3.4684605598449707, -1.9884185791015625, -0.5083770751953125, 0.9716644287109375, 2.4517059326171875, 3.9317476749420166, 5.411789417266846, 6.891830921173096, 8.371871948242188, 9.851914405822754, 11.331955909729004, 12.811997413635254, 14.292038917541504, 15.772080421447754, 17.25212287902832, 18.73216438293457, 20.21220588684082, 21.69224739074707, 23.17228889465332, 24.65233039855957, 26.13237190246582, 27.61241340637207, 29.09245491027832, 30.57249641418457, 32.05253982543945, 33.5325813293457, 35.01262283325195, 36.4926643371582, 37.97270584106445, 39.4527473449707, 40.93278884887695, 42.4128303527832, 43.89287185668945, 45.3729133605957, 46.85295486450195, 48.3329963684082]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 7.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 20.0, 19.0, 16.0, 28.0, 27.0, 19.0, 35.0, 23.0, 30.0, 40.0, 42.0, 43.0, 65.0, 37.0, 39.0, 47.0, 45.0, 50.0, 34.0, 36.0, 33.0, 29.0, 25.0, 17.0, 21.0, 23.0, 22.0, 13.0, 20.0, 8.0, 8.0, 15.0, 3.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.87109375, -5.6484375, -5.42578125, -5.203125, -4.98046875, -4.7578125, -4.53515625, -4.3125, -4.08984375, -3.8671875, -3.64453125, -3.421875, -3.19921875, -2.9765625, -2.75390625, -2.53125, -2.30859375, -2.0859375, -1.86328125, -1.640625, -1.41796875, -1.1953125, -0.97265625, -0.75, -0.52734375, -0.3046875, -0.08203125, 0.140625, 0.36328125, 0.5859375, 0.80859375, 1.03125, 1.25390625, 1.4765625, 1.69921875, 1.921875, 2.14453125, 2.3671875, 2.58984375, 2.8125, 3.03515625, 3.2578125, 3.48046875, 3.703125, 3.92578125, 4.1484375, 4.37109375, 4.59375, 4.81640625, 5.0390625, 5.26171875, 5.484375, 5.70703125, 5.9296875, 6.15234375, 6.375, 6.59765625, 6.8203125, 7.04296875, 7.265625, 7.48828125, 7.7109375, 7.93359375, 8.15625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 2.0, 13.0, 12.0, 18.0, 12.0, 35.0, 29.0, 43.0, 29.0, 57.0, 95.0, 120.0, 246.0, 557.0, 1970.0, 11276.0, 205060.0, 3335625.0, 613287.0, 20985.0, 3108.0, 824.0, 296.0, 169.0, 97.0, 73.0, 43.0, 30.0, 31.0, 24.0, 26.0, 16.0, 12.0, 13.0, 4.0, 8.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -18.828125, -18.09375, -17.359375, -16.625, -15.890625, -15.15625, -14.421875, -13.6875, -12.953125, -12.21875, -11.484375, -10.75, -10.015625, -9.28125, -8.546875, -7.8125, -7.078125, -6.34375, -5.609375, -4.875, -4.140625, -3.40625, -2.671875, -1.9375, -1.203125, -0.46875, 0.265625, 1.0, 1.734375, 2.46875, 3.203125, 3.9375, 4.671875, 5.40625, 6.140625, 6.875, 7.609375, 8.34375, 9.078125, 9.8125, 10.546875, 11.28125, 12.015625, 12.75, 13.484375, 14.21875, 14.953125, 15.6875, 16.421875, 17.15625, 17.890625, 18.625, 19.359375, 20.09375, 20.828125, 21.5625, 22.296875, 23.03125, 23.765625, 24.5, 25.234375, 25.96875, 26.703125, 27.4375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 8.0, 7.0, 7.0, 7.0, 13.0, 14.0, 16.0, 38.0, 35.0, 55.0, 76.0, 91.0, 140.0, 197.0, 271.0, 377.0, 507.0, 531.0, 475.0, 380.0, 262.0, 146.0, 125.0, 88.0, 46.0, 40.0, 38.0, 30.0, 17.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7578125, -13.3326416015625, -12.907470703125, -12.4822998046875, -12.05712890625, -11.6319580078125, -11.206787109375, -10.7816162109375, -10.3564453125, -9.9312744140625, -9.506103515625, -9.0809326171875, -8.65576171875, -8.2305908203125, -7.805419921875, -7.3802490234375, -6.955078125, -6.5299072265625, -6.104736328125, -5.6795654296875, -5.25439453125, -4.8292236328125, -4.404052734375, -3.9788818359375, -3.5537109375, -3.1285400390625, -2.703369140625, -2.2781982421875, -1.85302734375, -1.4278564453125, -1.002685546875, -0.5775146484375, -0.15234375, 0.2728271484375, 0.697998046875, 1.1231689453125, 1.54833984375, 1.9735107421875, 2.398681640625, 2.8238525390625, 3.2490234375, 3.6741943359375, 4.099365234375, 4.5245361328125, 4.94970703125, 5.3748779296875, 5.800048828125, 6.2252197265625, 6.650390625, 7.0755615234375, 7.500732421875, 7.9259033203125, 8.35107421875, 8.7762451171875, 9.201416015625, 9.6265869140625, 10.0517578125, 10.4769287109375, 10.902099609375, 11.3272705078125, 11.75244140625, 12.1776123046875, 12.602783203125, 13.0279541015625, 13.453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 13.0, 14.0, 25.0, 32.0, 46.0, 50.0, 74.0, 117.0, 156.0, 257.0, 317.0, 623.0, 5154.0, 3121429.0, 1061055.0, 3227.0, 495.0, 302.0, 248.0, 165.0, 120.0, 114.0, 68.0, 52.0, 38.0, 22.0, 11.0, 10.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -72.0458984375, -69.716796875, -67.3876953125, -65.05859375, -62.7294921875, -60.400390625, -58.0712890625, -55.7421875, -53.4130859375, -51.083984375, -48.7548828125, -46.42578125, -44.0966796875, -41.767578125, -39.4384765625, -37.109375, -34.7802734375, -32.451171875, -30.1220703125, -27.79296875, -25.4638671875, -23.134765625, -20.8056640625, -18.4765625, -16.1474609375, -13.818359375, -11.4892578125, -9.16015625, -6.8310546875, -4.501953125, -2.1728515625, 0.15625, 2.4853515625, 4.814453125, 7.1435546875, 9.47265625, 11.8017578125, 14.130859375, 16.4599609375, 18.7890625, 21.1181640625, 23.447265625, 25.7763671875, 28.10546875, 30.4345703125, 32.763671875, 35.0927734375, 37.421875, 39.7509765625, 42.080078125, 44.4091796875, 46.73828125, 49.0673828125, 51.396484375, 53.7255859375, 56.0546875, 58.3837890625, 60.712890625, 63.0419921875, 65.37109375, 67.7001953125, 70.029296875, 72.3583984375, 74.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 11.0, 30.0, 92.0, 202.0, 281.0, 206.0, 116.0, 45.0, 19.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.51287841796875, -168.0595703125, -164.60626220703125, -161.15296936035156, -157.6996612548828, -154.24635314941406, -150.7930450439453, -147.33973693847656, -143.88644409179688, -140.43313598632812, -136.97982788085938, -133.5265350341797, -130.07322692871094, -126.61991882324219, -123.16661071777344, -119.71331024169922, -116.25999450683594, -112.80668640136719, -109.35338592529297, -105.90007781982422, -102.44677734375, -98.99346923828125, -95.5401611328125, -92.08686065673828, -88.63356018066406, -85.18025207519531, -81.7269515991211, -78.27364349365234, -74.82034301757812, -71.36703491210938, -67.91372680664062, -64.4604263305664, -61.007118225097656, -57.55381393432617, -54.10050964355469, -50.64720153808594, -47.19389724731445, -43.74059295654297, -40.287288665771484, -36.833984375, -33.38067626953125, -29.927371978759766, -26.47406578063965, -23.020761489868164, -19.567455291748047, -16.114151000976562, -12.660846710205078, -9.207540512084961, -5.754238128662109, -2.3009331226348877, 1.152371883392334, 4.605676651000977, 8.058981895446777, 11.512287139892578, 14.965591430664062, 18.41889762878418, 21.872201919555664, 25.32550621032715, 28.778812408447266, 32.23211669921875, 35.685420989990234, 39.13872528076172, 42.59203338623047, 46.04533767700195, 49.49864196777344]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 5.0, 2.0, 11.0, 15.0, 17.0, 13.0, 17.0, 18.0, 19.0, 15.0, 20.0, 24.0, 28.0, 33.0, 31.0, 31.0, 39.0, 45.0, 37.0, 54.0, 38.0, 47.0, 51.0, 36.0, 38.0, 37.0, 24.0, 30.0, 31.0, 19.0, 20.0, 22.0, 13.0, 23.0, 14.0, 18.0, 17.0, 10.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.41998291015625, -37.218482971191406, -36.01698303222656, -34.81548309326172, -33.613983154296875, -32.412479400634766, -31.210979461669922, -30.009479522705078, -28.807979583740234, -27.60647964477539, -26.404979705810547, -25.20347785949707, -24.001977920532227, -22.800477981567383, -21.598976135253906, -20.397476196289062, -19.19597625732422, -17.994476318359375, -16.79297637939453, -15.591474533081055, -14.389974594116211, -13.188474655151367, -11.986973762512207, -10.785472869873047, -9.583972930908203, -8.38247299194336, -7.180972099304199, -5.979471683502197, -4.777971267700195, -3.5764708518981934, -2.3749704360961914, -1.1734695434570312, 0.0280303955078125, 1.2295308113098145, 2.4310312271118164, 3.6325316429138184, 4.83403205871582, 6.035532474517822, 7.237032890319824, 8.438533782958984, 9.640033721923828, 10.841533660888672, 12.043034553527832, 13.244535446166992, 14.446035385131836, 15.64753532409668, 16.849037170410156, 18.050537109375, 19.252037048339844, 20.453536987304688, 21.65503692626953, 22.856538772583008, 24.05803871154785, 25.259538650512695, 26.461040496826172, 27.662540435791016, 28.86404037475586, 30.065540313720703, 31.267040252685547, 32.46854019165039, 33.6700439453125, 34.871543884277344, 36.07304382324219, 37.27454376220703, 38.476043701171875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 48.0, 41.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 16.0, 26.0, 26.0, 52.0, 67.0, 100.0, 174.0, 260.0, 418.0, 710.0, 1189.0, 1977.0, 3160.0, 5145.0, 8273.0, 12600.0, 20089.0, 31966.0, 52147.0, 85864.0, 137606.0, 187584.0, 177016.0, 122884.0, 76292.0, 45968.0, 28269.0, 17873.0, 11415.0, 7367.0, 4664.0, 2928.0, 1660.0, 1098.0, 649.0, 414.0, 232.0, 141.0, 76.0, 53.0, 35.0, 30.0, 16.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7509765625, -0.7281341552734375, -0.705291748046875, -0.6824493408203125, -0.65960693359375, -0.6367645263671875, -0.613922119140625, -0.5910797119140625, -0.5682373046875, -0.5453948974609375, -0.522552490234375, -0.4997100830078125, -0.47686767578125, -0.4540252685546875, -0.431182861328125, -0.4083404541015625, -0.385498046875, -0.3626556396484375, -0.339813232421875, -0.3169708251953125, -0.29412841796875, -0.2712860107421875, -0.248443603515625, -0.2256011962890625, -0.2027587890625, -0.1799163818359375, -0.157073974609375, -0.1342315673828125, -0.11138916015625, -0.0885467529296875, -0.065704345703125, -0.0428619384765625, -0.02001953125, 0.0028228759765625, 0.025665283203125, 0.0485076904296875, 0.07135009765625, 0.0941925048828125, 0.117034912109375, 0.1398773193359375, 0.1627197265625, 0.1855621337890625, 0.208404541015625, 0.2312469482421875, 0.25408935546875, 0.2769317626953125, 0.299774169921875, 0.3226165771484375, 0.345458984375, 0.3683013916015625, 0.391143798828125, 0.4139862060546875, 0.43682861328125, 0.4596710205078125, 0.482513427734375, 0.5053558349609375, 0.5281982421875, 0.5510406494140625, 0.573883056640625, 0.5967254638671875, 0.61956787109375, 0.6424102783203125, 0.665252685546875, 0.6880950927734375, 0.7109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 12.0, 14.0, 18.0, 17.0, 21.0, 20.0, 23.0, 28.0, 45.0, 35.0, 29.0, 35.0, 34.0, 55.0, 48.0, 1061.0, 39.0, 45.0, 47.0, 38.0, 43.0, 33.0, 31.0, 32.0, 23.0, 21.0, 21.0, 12.0, 17.0, 7.0, 12.0, 12.0, 11.0, 13.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.98590087890625, -3.8507080078125, -3.71551513671875, -3.580322265625, -3.44512939453125, -3.3099365234375, -3.17474365234375, -3.03955078125, -2.90435791015625, -2.7691650390625, -2.63397216796875, -2.498779296875, -2.36358642578125, -2.2283935546875, -2.09320068359375, -1.9580078125, -1.82281494140625, -1.6876220703125, -1.55242919921875, -1.417236328125, -1.28204345703125, -1.1468505859375, -1.01165771484375, -0.87646484375, -0.74127197265625, -0.6060791015625, -0.47088623046875, -0.335693359375, -0.20050048828125, -0.0653076171875, 0.06988525390625, 0.205078125, 0.34027099609375, 0.4754638671875, 0.61065673828125, 0.745849609375, 0.88104248046875, 1.0162353515625, 1.15142822265625, 1.28662109375, 1.42181396484375, 1.5570068359375, 1.69219970703125, 1.827392578125, 1.96258544921875, 2.0977783203125, 2.23297119140625, 2.3681640625, 2.50335693359375, 2.6385498046875, 2.77374267578125, 2.908935546875, 3.04412841796875, 3.1793212890625, 3.31451416015625, 3.44970703125, 3.58489990234375, 3.7200927734375, 3.85528564453125, 3.990478515625, 4.12567138671875, 4.2608642578125, 4.39605712890625, 4.53125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 9.0, 18.0, 19.0, 25.0, 66.0, 97.0, 153.0, 249.0, 440.0, 731.0, 1157.0, 1952.0, 3181.0, 5565.0, 9110.0, 15496.0, 25759.0, 43715.0, 71316.0, 112372.0, 159275.0, 1227935.0, 151684.0, 104017.0, 65222.0, 39335.0, 23240.0, 14023.0, 8394.0, 5032.0, 3048.0, 1811.0, 1042.0, 643.0, 376.0, 218.0, 165.0, 83.0, 49.0, 46.0, 23.0, 21.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5597152709960938, -0.5413055419921875, -0.5228958129882812, -0.504486083984375, -0.48607635498046875, -0.4676666259765625, -0.44925689697265625, -0.43084716796875, -0.41243743896484375, -0.3940277099609375, -0.37561798095703125, -0.357208251953125, -0.33879852294921875, -0.3203887939453125, -0.30197906494140625, -0.2835693359375, -0.26515960693359375, -0.2467498779296875, -0.22834014892578125, -0.209930419921875, -0.19152069091796875, -0.1731109619140625, -0.15470123291015625, -0.13629150390625, -0.11788177490234375, -0.0994720458984375, -0.08106231689453125, -0.062652587890625, -0.04424285888671875, -0.0258331298828125, -0.00742340087890625, 0.010986328125, 0.02939605712890625, 0.0478057861328125, 0.06621551513671875, 0.084625244140625, 0.10303497314453125, 0.1214447021484375, 0.13985443115234375, 0.15826416015625, 0.17667388916015625, 0.1950836181640625, 0.21349334716796875, 0.231903076171875, 0.25031280517578125, 0.2687225341796875, 0.28713226318359375, 0.3055419921875, 0.32395172119140625, 0.3423614501953125, 0.36077117919921875, 0.379180908203125, 0.39759063720703125, 0.4160003662109375, 0.43441009521484375, 0.45281982421875, 0.47122955322265625, 0.4896392822265625, 0.5080490112304688, 0.526458740234375, 0.5448684692382812, 0.5632781982421875, 0.5816879272460938, 0.60009765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 8.0, 5.0, 11.0, 10.0, 20.0, 21.0, 22.0, 32.0, 29.0, 38.0, 39.0, 43.0, 45.0, 43.0, 62.0, 68.0, 74.0, 69.0, 50.0, 35.0, 36.0, 39.0, 34.0, 28.0, 27.0, 21.0, 18.0, 15.0, 5.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.003307342529296875, -0.0032024383544921875, -0.0030975341796875, -0.0029926300048828125, -0.002887725830078125, -0.0027828216552734375, -0.00267791748046875, -0.0025730133056640625, -0.002468109130859375, -0.0023632049560546875, -0.00225830078125, -0.0021533966064453125, -0.002048492431640625, -0.0019435882568359375, -0.00183868408203125, -0.0017337799072265625, -0.001628875732421875, -0.0015239715576171875, -0.0014190673828125, -0.0013141632080078125, -0.001209259033203125, -0.0011043548583984375, -0.00099945068359375, -0.0008945465087890625, -0.000789642333984375, -0.0006847381591796875, -0.000579833984375, -0.0004749298095703125, -0.000370025634765625, -0.0002651214599609375, -0.00016021728515625, -5.53131103515625e-05, 4.9591064453125e-05, 0.0001544952392578125, 0.0002593994140625, 0.0003643035888671875, 0.000469207763671875, 0.0005741119384765625, 0.00067901611328125, 0.0007839202880859375, 0.000888824462890625, 0.0009937286376953125, 0.0010986328125, 0.0012035369873046875, 0.001308441162109375, 0.0014133453369140625, 0.00151824951171875, 0.0016231536865234375, 0.001728057861328125, 0.0018329620361328125, 0.0019378662109375, 0.0020427703857421875, 0.002147674560546875, 0.0022525787353515625, 0.00235748291015625, 0.0024623870849609375, 0.002567291259765625, 0.0026721954345703125, 0.002777099609375, 0.0028820037841796875, 0.002986907958984375, 0.0030918121337890625, 0.00319671630859375, 0.0033016204833984375, 0.003406524658203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 8.0, 8.0, 12.0, 14.0, 27.0, 29.0, 28.0, 44.0, 56.0, 83.0, 100.0, 139.0, 265.0, 619.0, 9037.0, 936400.0, 99086.0, 1547.0, 355.0, 190.0, 128.0, 71.0, 72.0, 48.0, 37.0, 33.0, 22.0, 19.0, 14.0, 9.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07609367370605469, -0.07369613647460938, -0.07129859924316406, -0.06890106201171875, -0.06650352478027344, -0.06410598754882812, -0.06170845031738281, -0.0593109130859375, -0.05691337585449219, -0.054515838623046875, -0.05211830139160156, -0.04972076416015625, -0.04732322692871094, -0.044925689697265625, -0.04252815246582031, -0.040130615234375, -0.03773307800292969, -0.035335540771484375, -0.03293800354003906, -0.03054046630859375, -0.028142929077148438, -0.025745391845703125, -0.023347854614257812, -0.0209503173828125, -0.018552780151367188, -0.016155242919921875, -0.013757705688476562, -0.01136016845703125, -0.008962631225585938, -0.006565093994140625, -0.0041675567626953125, -0.00177001953125, 0.0006275177001953125, 0.003025054931640625, 0.0054225921630859375, 0.00782012939453125, 0.010217666625976562, 0.012615203857421875, 0.015012741088867188, 0.0174102783203125, 0.019807815551757812, 0.022205352783203125, 0.024602890014648438, 0.02700042724609375, 0.029397964477539062, 0.031795501708984375, 0.03419303894042969, 0.036590576171875, 0.03898811340332031, 0.041385650634765625, 0.04378318786621094, 0.04618072509765625, 0.04857826232910156, 0.050975799560546875, 0.05337333679199219, 0.0557708740234375, 0.05816841125488281, 0.060565948486328125, 0.06296348571777344, 0.06536102294921875, 0.06775856018066406, 0.07015609741210938, 0.07255363464355469, 0.074951171875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 20.0, 140.0, 533.0, 246.0, 58.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028252651914954185, -0.027736257761716843, -0.0272198636084795, -0.026703469455242157, -0.026187075302004814, -0.02567068114876747, -0.02515428699553013, -0.024637892842292786, -0.024121496826410294, -0.02360510267317295, -0.023088708519935608, -0.022572314366698265, -0.022055920213460922, -0.02153952606022358, -0.021023131906986237, -0.020506735891103745, -0.01999034360051155, -0.019473949447274208, -0.018957555294036865, -0.018441161140799522, -0.01792476698756218, -0.017408372834324837, -0.016891978681087494, -0.016375582665205002, -0.015859190374612808, -0.015342796221375465, -0.014826402068138123, -0.01431000791490078, -0.013793613761663437, -0.013277219608426094, -0.012760824523866177, -0.012244430370628834, -0.011728035286068916, -0.011211641132831573, -0.01069524697959423, -0.010178852826356888, -0.009662458673119545, -0.009146064519882202, -0.008629669435322285, -0.008113275282084942, -0.007596881128847599, -0.007080486975610256, -0.006564092822372913, -0.006047698203474283, -0.00553130405023694, -0.0050149098969995975, -0.004498515278100967, -0.003982121124863625, -0.0034657269716262817, -0.002949332818388939, -0.0024329384323209524, -0.0019165441626682878, -0.001400149893015623, -0.0008837557397782803, -0.00036736135371029377, 0.00014903303235769272, 0.0006654271855950356, 0.0011818214552477002, 0.0016982157249003649, 0.0022146101109683514, 0.002731004264205694, 0.003247398417443037, 0.0037637928035110235, 0.00428018718957901, 0.004796581342816353]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 11.0, 14.0, 15.0, 27.0, 20.0, 35.0, 23.0, 26.0, 35.0, 37.0, 31.0, 44.0, 50.0, 36.0, 40.0, 49.0, 46.0, 51.0, 52.0, 38.0, 45.0, 30.0, 22.0, 34.0, 41.0, 17.0, 22.0, 20.0, 21.0, 11.0, 11.0, 9.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024050474166870117, -0.002334785647690296, -0.0022645238786935806, -0.002194262109696865, -0.0021240003407001495, -0.002053738571703434, -0.0019834768027067184, -0.001913215033710003, -0.0018429532647132874, -0.0017726914957165718, -0.0017024297267198563, -0.0016321679577231407, -0.0015619061887264252, -0.0014916444197297096, -0.001421382650732994, -0.0013511208817362785, -0.001280859112739563, -0.0012105973437428474, -0.001140335574746132, -0.0010700738057494164, -0.0009998120367527008, -0.0009295502677559853, -0.0008592884987592697, -0.0007890267297625542, -0.0007187649607658386, -0.0006485031917691231, -0.0005782414227724075, -0.000507979653775692, -0.00043771788477897644, -0.0003674561157822609, -0.00029719434678554535, -0.0002269325777888298, -0.00015667080879211426, -8.640903979539871e-05, -1.6147270798683167e-05, 5.411449819803238e-05, 0.00012437626719474792, 0.00019463803619146347, 0.000264899805188179, 0.00033516157418489456, 0.0004054233431816101, 0.00047568511217832565, 0.0005459468811750412, 0.0006162086501717567, 0.0006864704191684723, 0.0007567321881651878, 0.0008269939571619034, 0.0008972557261586189, 0.0009675174951553345, 0.00103777926415205, 0.0011080410331487656, 0.0011783028021454811, 0.0012485645711421967, 0.0013188263401389122, 0.0013890881091356277, 0.0014593498781323433, 0.0015296116471290588, 0.0015998734161257744, 0.00167013518512249, 0.0017403969541192055, 0.001810658723115921, 0.0018809204921126366, 0.0019511822611093521, 0.0020214440301060677, 0.002091705799102783]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 47.0, 42.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 11.0, 11.0, 10.0, 15.0, 15.0, 11.0, 37.0, 30.0, 41.0, 60.0, 75.0, 114.0, 130.0, 232.0, 344.0, 633.0, 1336.0, 3459.0, 13149.0, 74670.0, 747616.0, 174254.0, 22854.0, 5562.0, 1778.0, 786.0, 421.0, 260.0, 168.0, 114.0, 69.0, 61.0, 51.0, 40.0, 27.0, 24.0, 12.0, 14.0, 18.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -10.999267578125, -10.61572265625, -10.232177734375, -9.8486328125, -9.465087890625, -9.08154296875, -8.697998046875, -8.314453125, -7.930908203125, -7.54736328125, -7.163818359375, -6.7802734375, -6.396728515625, -6.01318359375, -5.629638671875, -5.24609375, -4.862548828125, -4.47900390625, -4.095458984375, -3.7119140625, -3.328369140625, -2.94482421875, -2.561279296875, -2.177734375, -1.794189453125, -1.41064453125, -1.027099609375, -0.6435546875, -0.260009765625, 0.12353515625, 0.507080078125, 0.890625, 1.274169921875, 1.65771484375, 2.041259765625, 2.4248046875, 2.808349609375, 3.19189453125, 3.575439453125, 3.958984375, 4.342529296875, 4.72607421875, 5.109619140625, 5.4931640625, 5.876708984375, 6.26025390625, 6.643798828125, 7.02734375, 7.410888671875, 7.79443359375, 8.177978515625, 8.5615234375, 8.945068359375, 9.32861328125, 9.712158203125, 10.095703125, 10.479248046875, 10.86279296875, 11.246337890625, 11.6298828125, 12.013427734375, 12.39697265625, 12.780517578125, 13.1640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 8.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 20.0, 20.0, 25.0, 33.0, 33.0, 24.0, 22.0, 35.0, 41.0, 44.0, 63.0, 155.0, 1776.0, 204.0, 59.0, 45.0, 52.0, 49.0, 47.0, 35.0, 38.0, 29.0, 29.0, 12.0, 26.0, 19.0, 11.0, 10.0, 11.0, 8.0, 3.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.457275390625, -17.78955078125, -17.121826171875, -16.4541015625, -15.786376953125, -15.11865234375, -14.450927734375, -13.783203125, -13.115478515625, -12.44775390625, -11.780029296875, -11.1123046875, -10.444580078125, -9.77685546875, -9.109130859375, -8.44140625, -7.773681640625, -7.10595703125, -6.438232421875, -5.7705078125, -5.102783203125, -4.43505859375, -3.767333984375, -3.099609375, -2.431884765625, -1.76416015625, -1.096435546875, -0.4287109375, 0.239013671875, 0.90673828125, 1.574462890625, 2.2421875, 2.909912109375, 3.57763671875, 4.245361328125, 4.9130859375, 5.580810546875, 6.24853515625, 6.916259765625, 7.583984375, 8.251708984375, 8.91943359375, 9.587158203125, 10.2548828125, 10.922607421875, 11.59033203125, 12.258056640625, 12.92578125, 13.593505859375, 14.26123046875, 14.928955078125, 15.5966796875, 16.264404296875, 16.93212890625, 17.599853515625, 18.267578125, 18.935302734375, 19.60302734375, 20.270751953125, 20.9384765625, 21.606201171875, 22.27392578125, 22.941650390625, 23.609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 12.0, 11.0, 27.0, 24.0, 30.0, 44.0, 48.0, 67.0, 65.0, 115.0, 177.0, 313.0, 801.0, 14052.0, 3121063.0, 7328.0, 636.0, 304.0, 141.0, 87.0, 59.0, 47.0, 43.0, 33.0, 31.0, 24.0, 18.0, 7.0, 15.0, 10.0, 7.0, 6.0, 7.0, 7.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-71.125, -69.0595703125, -66.994140625, -64.9287109375, -62.86328125, -60.7978515625, -58.732421875, -56.6669921875, -54.6015625, -52.5361328125, -50.470703125, -48.4052734375, -46.33984375, -44.2744140625, -42.208984375, -40.1435546875, -38.078125, -36.0126953125, -33.947265625, -31.8818359375, -29.81640625, -27.7509765625, -25.685546875, -23.6201171875, -21.5546875, -19.4892578125, -17.423828125, -15.3583984375, -13.29296875, -11.2275390625, -9.162109375, -7.0966796875, -5.03125, -2.9658203125, -0.900390625, 1.1650390625, 3.23046875, 5.2958984375, 7.361328125, 9.4267578125, 11.4921875, 13.5576171875, 15.623046875, 17.6884765625, 19.75390625, 21.8193359375, 23.884765625, 25.9501953125, 28.015625, 30.0810546875, 32.146484375, 34.2119140625, 36.27734375, 38.3427734375, 40.408203125, 42.4736328125, 44.5390625, 46.6044921875, 48.669921875, 50.7353515625, 52.80078125, 54.8662109375, 56.931640625, 58.9970703125, 61.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 110.0, 746.0, 157.0, 5.0], "bins": [-245.0657196044922, -241.08157348632812, -237.09744262695312, -233.11329650878906, -229.129150390625, -225.14500427246094, -221.16085815429688, -217.17672729492188, -213.1925811767578, -209.20843505859375, -205.22430419921875, -201.2401580810547, -197.25601196289062, -193.27186584472656, -189.2877197265625, -185.3035888671875, -181.31944274902344, -177.33529663085938, -173.35116577148438, -169.3670196533203, -165.38287353515625, -161.3987274169922, -157.41458129882812, -153.43045043945312, -149.44630432128906, -145.462158203125, -141.47802734375, -137.49388122558594, -133.50973510742188, -129.5255889892578, -125.54145050048828, -121.55731201171875, -117.57316589355469, -113.58901977539062, -109.6048812866211, -105.62074279785156, -101.6365966796875, -97.65245056152344, -93.6683120727539, -89.68417358398438, -85.70002746582031, -81.71588134765625, -77.73174285888672, -73.74760437011719, -69.76345825195312, -65.77931213378906, -61.79517364501953, -57.811031341552734, -53.82688522338867, -49.842742919921875, -45.85860061645508, -41.87445831298828, -37.890316009521484, -33.90617370605469, -29.92203140258789, -25.937889099121094, -21.953746795654297, -17.9696044921875, -13.985462188720703, -10.001319885253906, -6.017177581787109, -2.0330352783203125, 1.9511070251464844, 5.935249328613281, 9.919390678405762]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 8.0, 11.0, 7.0, 6.0, 12.0, 17.0, 16.0, 16.0, 19.0, 17.0, 30.0, 28.0, 18.0, 40.0, 34.0, 32.0, 33.0, 36.0, 35.0, 39.0, 41.0, 40.0, 33.0, 45.0, 40.0, 31.0, 38.0, 27.0, 21.0, 32.0, 27.0, 17.0, 20.0, 19.0, 16.0, 19.0, 10.0, 12.0, 11.0, 8.0, 7.0, 3.0, 7.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-62.56318664550781, -60.72850036621094, -58.89381408691406, -57.05912780761719, -55.22444152832031, -53.38975524902344, -51.55506896972656, -49.72038269042969, -47.88569641113281, -46.05101013183594, -44.21632385253906, -42.38163757324219, -40.54695129394531, -38.71226501464844, -36.87757873535156, -35.04289245605469, -33.20820236206055, -31.373516082763672, -29.538829803466797, -27.704143524169922, -25.869457244873047, -24.034770965576172, -22.200082778930664, -20.36539649963379, -18.530710220336914, -16.69602394104004, -14.861337661743164, -13.026650428771973, -11.191964149475098, -9.357277870178223, -7.522590637207031, -5.687904357910156, -3.8532180786132812, -2.018531560897827, -0.18384504318237305, 1.6508417129516602, 3.485527992248535, 5.32021427154541, 7.154901504516602, 8.989587783813477, 10.824274063110352, 12.658960342407227, 14.493646621704102, 16.32833480834961, 18.163021087646484, 19.99770736694336, 21.832393646240234, 23.66707992553711, 25.501766204833984, 27.33645248413086, 29.171138763427734, 31.00582504272461, 32.840511322021484, 34.67519760131836, 36.5098876953125, 38.344573974609375, 40.17926025390625, 42.013946533203125, 43.8486328125, 45.683319091796875, 47.51800537109375, 49.352691650390625, 51.1873779296875, 53.022064208984375, 54.85675048828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 2.0, 11.0, 6.0, 10.0, 13.0, 7.0, 22.0, 22.0, 21.0, 26.0, 24.0, 32.0, 36.0, 30.0, 48.0, 42.0, 48.0, 41.0, 50.0, 36.0, 44.0, 37.0, 48.0, 42.0, 36.0, 38.0, 30.0, 23.0, 24.0, 21.0, 19.0, 16.0, 20.0, 5.0, 6.0, 14.0, 10.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.98614501953125, -6.7535400390625, -6.52093505859375, -6.288330078125, -6.05572509765625, -5.8231201171875, -5.59051513671875, -5.35791015625, -5.12530517578125, -4.8927001953125, -4.66009521484375, -4.427490234375, -4.19488525390625, -3.9622802734375, -3.72967529296875, -3.4970703125, -3.26446533203125, -3.0318603515625, -2.79925537109375, -2.566650390625, -2.33404541015625, -2.1014404296875, -1.86883544921875, -1.63623046875, -1.40362548828125, -1.1710205078125, -0.93841552734375, -0.705810546875, -0.47320556640625, -0.2406005859375, -0.00799560546875, 0.224609375, 0.45721435546875, 0.6898193359375, 0.92242431640625, 1.155029296875, 1.38763427734375, 1.6202392578125, 1.85284423828125, 2.08544921875, 2.31805419921875, 2.5506591796875, 2.78326416015625, 3.015869140625, 3.24847412109375, 3.4810791015625, 3.71368408203125, 3.9462890625, 4.17889404296875, 4.4114990234375, 4.64410400390625, 4.876708984375, 5.10931396484375, 5.3419189453125, 5.57452392578125, 5.80712890625, 6.03973388671875, 6.2723388671875, 6.50494384765625, 6.737548828125, 6.97015380859375, 7.2027587890625, 7.43536376953125, 7.66796875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 4.0, 11.0, 10.0, 17.0, 23.0, 38.0, 34.0, 56.0, 79.0, 136.0, 203.0, 287.0, 466.0, 763.0, 1361.0, 2472.0, 4900.0, 10476.0, 26248.0, 86239.0, 331269.0, 1018546.0, 1557390.0, 808837.0, 239734.0, 64975.0, 21212.0, 8755.0, 4182.0, 2266.0, 1186.0, 713.0, 471.0, 277.0, 172.0, 119.0, 103.0, 65.0, 45.0, 36.0, 26.0, 19.0, 13.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.328125, -8.062744140625, -7.79736328125, -7.531982421875, -7.2666015625, -7.001220703125, -6.73583984375, -6.470458984375, -6.205078125, -5.939697265625, -5.67431640625, -5.408935546875, -5.1435546875, -4.878173828125, -4.61279296875, -4.347412109375, -4.08203125, -3.816650390625, -3.55126953125, -3.285888671875, -3.0205078125, -2.755126953125, -2.48974609375, -2.224365234375, -1.958984375, -1.693603515625, -1.42822265625, -1.162841796875, -0.8974609375, -0.632080078125, -0.36669921875, -0.101318359375, 0.1640625, 0.429443359375, 0.69482421875, 0.960205078125, 1.2255859375, 1.490966796875, 1.75634765625, 2.021728515625, 2.287109375, 2.552490234375, 2.81787109375, 3.083251953125, 3.3486328125, 3.614013671875, 3.87939453125, 4.144775390625, 4.41015625, 4.675537109375, 4.94091796875, 5.206298828125, 5.4716796875, 5.737060546875, 6.00244140625, 6.267822265625, 6.533203125, 6.798583984375, 7.06396484375, 7.329345703125, 7.5947265625, 7.860107421875, 8.12548828125, 8.390869140625, 8.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 12.0, 5.0, 22.0, 36.0, 50.0, 100.0, 113.0, 179.0, 268.0, 408.0, 621.0, 687.0, 532.0, 366.0, 258.0, 144.0, 97.0, 60.0, 52.0, 23.0, 19.0, 8.0, 6.0, 8.0, 7.0, 1.0, 1.0], "bins": [-29.265625, -28.6602783203125, -28.054931640625, -27.4495849609375, -26.84423828125, -26.2388916015625, -25.633544921875, -25.0281982421875, -24.4228515625, -23.8175048828125, -23.212158203125, -22.6068115234375, -22.00146484375, -21.3961181640625, -20.790771484375, -20.1854248046875, -19.580078125, -18.9747314453125, -18.369384765625, -17.7640380859375, -17.15869140625, -16.5533447265625, -15.947998046875, -15.3426513671875, -14.7373046875, -14.1319580078125, -13.526611328125, -12.9212646484375, -12.31591796875, -11.7105712890625, -11.105224609375, -10.4998779296875, -9.89453125, -9.2891845703125, -8.683837890625, -8.0784912109375, -7.47314453125, -6.8677978515625, -6.262451171875, -5.6571044921875, -5.0517578125, -4.4464111328125, -3.841064453125, -3.2357177734375, -2.63037109375, -2.0250244140625, -1.419677734375, -0.8143310546875, -0.208984375, 0.3963623046875, 1.001708984375, 1.6070556640625, 2.21240234375, 2.8177490234375, 3.423095703125, 4.0284423828125, 4.6337890625, 5.2391357421875, 5.844482421875, 6.4498291015625, 7.05517578125, 7.6605224609375, 8.265869140625, 8.8712158203125, 9.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 15.0, 17.0, 32.0, 65.0, 103.0, 158.0, 282.0, 440.0, 1007.0, 7899.0, 4055565.0, 125536.0, 1680.0, 608.0, 357.0, 223.0, 125.0, 72.0, 44.0, 29.0, 16.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.9375, -60.2841796875, -57.630859375, -54.9775390625, -52.32421875, -49.6708984375, -47.017578125, -44.3642578125, -41.7109375, -39.0576171875, -36.404296875, -33.7509765625, -31.09765625, -28.4443359375, -25.791015625, -23.1376953125, -20.484375, -17.8310546875, -15.177734375, -12.5244140625, -9.87109375, -7.2177734375, -4.564453125, -1.9111328125, 0.7421875, 3.3955078125, 6.048828125, 8.7021484375, 11.35546875, 14.0087890625, 16.662109375, 19.3154296875, 21.96875, 24.6220703125, 27.275390625, 29.9287109375, 32.58203125, 35.2353515625, 37.888671875, 40.5419921875, 43.1953125, 45.8486328125, 48.501953125, 51.1552734375, 53.80859375, 56.4619140625, 59.115234375, 61.7685546875, 64.421875, 67.0751953125, 69.728515625, 72.3818359375, 75.03515625, 77.6884765625, 80.341796875, 82.9951171875, 85.6484375, 88.3017578125, 90.955078125, 93.6083984375, 96.26171875, 98.9150390625, 101.568359375, 104.2216796875, 106.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 342.0, 676.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1392.4459228515625, -1367.169921875, -1341.89404296875, -1316.6180419921875, -1291.3421630859375, -1266.066162109375, -1240.790283203125, -1215.5142822265625, -1190.2384033203125, -1164.96240234375, -1139.6865234375, -1114.4105224609375, -1089.1346435546875, -1063.858642578125, -1038.582763671875, -1013.3067626953125, -988.0308227539062, -962.7548828125, -937.4789428710938, -912.2030029296875, -886.9270629882812, -861.651123046875, -836.3751220703125, -811.0992431640625, -785.8232421875, -760.5473022460938, -735.2713623046875, -709.9954223632812, -684.719482421875, -659.4435424804688, -634.1676025390625, -608.8916015625, -583.61572265625, -558.3397827148438, -533.0638427734375, -507.78790283203125, -482.511962890625, -457.23602294921875, -431.9600524902344, -406.6841125488281, -381.408203125, -356.13226318359375, -330.8563232421875, -305.58038330078125, -280.304443359375, -255.0284881591797, -229.75253295898438, -204.47659301757812, -179.2006378173828, -153.92469787597656, -128.64874267578125, -103.372802734375, -78.09686279296875, -52.8209228515625, -27.544967651367188, -2.2690277099609375, 23.006912231445312, 48.28285598754883, 73.55879974365234, 98.83474731445312, 124.11068725585938, 149.38662719726562, 174.66258239746094, 199.9385223388672, 225.21446228027344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 9.0, 15.0, 18.0, 12.0, 26.0, 31.0, 27.0, 43.0, 48.0, 51.0, 50.0, 58.0, 58.0, 62.0, 62.0, 47.0, 55.0, 50.0, 56.0, 45.0, 33.0, 40.0, 26.0, 20.0, 23.0, 14.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.742645263671875, -43.7707633972168, -41.79888153076172, -39.82699966430664, -37.85511779785156, -35.88323974609375, -33.91135787963867, -31.939476013183594, -29.967594146728516, -27.995712280273438, -26.02383041381836, -24.051950454711914, -22.080068588256836, -20.108186721801758, -18.136306762695312, -16.164424896240234, -14.192543029785156, -12.220661163330078, -10.248780250549316, -8.276899337768555, -6.305017471313477, -4.333135604858398, -2.3612546920776367, -0.389373779296875, 1.5825080871582031, 3.554389476776123, 5.526270866394043, 7.498152256011963, 9.470033645629883, 11.441915512084961, 13.413796424865723, 15.385677337646484, 17.357559204101562, 19.32944107055664, 21.30132293701172, 23.273202896118164, 25.245084762573242, 27.21696662902832, 29.188846588134766, 31.160728454589844, 33.13261032104492, 35.1044921875, 37.07637405395508, 39.048255920410156, 41.02013397216797, 42.99201965332031, 44.963897705078125, 46.9357795715332, 48.90766143798828, 50.87954330444336, 52.85142517089844, 54.823307037353516, 56.795188903808594, 58.767066955566406, 60.738948822021484, 62.71083068847656, 64.68270874023438, 66.65458679199219, 68.62647247314453, 70.59835052490234, 72.57023620605469, 74.5421142578125, 76.51399993896484, 78.48587799072266, 80.457763671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 40.0, 46.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 21.0, 39.0, 51.0, 69.0, 94.0, 170.0, 248.0, 358.0, 501.0, 679.0, 1040.0, 1590.0, 2242.0, 3376.0, 4780.0, 7045.0, 10458.0, 15408.0, 22632.0, 34583.0, 51116.0, 77387.0, 110941.0, 147149.0, 157669.0, 126405.0, 89143.0, 60510.0, 39794.0, 26825.0, 18041.0, 12245.0, 8298.0, 5520.0, 3900.0, 2583.0, 1810.0, 1204.0, 821.0, 591.0, 381.0, 282.0, 180.0, 128.0, 81.0, 52.0, 41.0, 22.0, 18.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.6103515625, -0.5919647216796875, -0.573577880859375, -0.5551910400390625, -0.53680419921875, -0.5184173583984375, -0.500030517578125, -0.4816436767578125, -0.4632568359375, -0.4448699951171875, -0.426483154296875, -0.4080963134765625, -0.38970947265625, -0.3713226318359375, -0.352935791015625, -0.3345489501953125, -0.316162109375, -0.2977752685546875, -0.279388427734375, -0.2610015869140625, -0.24261474609375, -0.2242279052734375, -0.205841064453125, -0.1874542236328125, -0.1690673828125, -0.1506805419921875, -0.132293701171875, -0.1139068603515625, -0.09552001953125, -0.0771331787109375, -0.058746337890625, -0.0403594970703125, -0.02197265625, -0.0035858154296875, 0.014801025390625, 0.0331878662109375, 0.05157470703125, 0.0699615478515625, 0.088348388671875, 0.1067352294921875, 0.1251220703125, 0.1435089111328125, 0.161895751953125, 0.1802825927734375, 0.19866943359375, 0.2170562744140625, 0.235443115234375, 0.2538299560546875, 0.272216796875, 0.2906036376953125, 0.308990478515625, 0.3273773193359375, 0.34576416015625, 0.3641510009765625, 0.382537841796875, 0.4009246826171875, 0.4193115234375, 0.4376983642578125, 0.456085205078125, 0.4744720458984375, 0.49285888671875, 0.5112457275390625, 0.529632568359375, 0.5480194091796875, 0.56640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 4.0, 5.0, 15.0, 14.0, 18.0, 23.0, 27.0, 15.0, 24.0, 31.0, 38.0, 32.0, 30.0, 48.0, 36.0, 44.0, 42.0, 1065.0, 38.0, 44.0, 39.0, 32.0, 35.0, 29.0, 37.0, 23.0, 25.0, 21.0, 35.0, 23.0, 21.0, 15.0, 12.0, 12.0, 8.0, 7.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.4183349609375, -4.281982421875, -4.1456298828125, -4.00927734375, -3.8729248046875, -3.736572265625, -3.6002197265625, -3.4638671875, -3.3275146484375, -3.191162109375, -3.0548095703125, -2.91845703125, -2.7821044921875, -2.645751953125, -2.5093994140625, -2.373046875, -2.2366943359375, -2.100341796875, -1.9639892578125, -1.82763671875, -1.6912841796875, -1.554931640625, -1.4185791015625, -1.2822265625, -1.1458740234375, -1.009521484375, -0.8731689453125, -0.73681640625, -0.6004638671875, -0.464111328125, -0.3277587890625, -0.19140625, -0.0550537109375, 0.081298828125, 0.2176513671875, 0.35400390625, 0.4903564453125, 0.626708984375, 0.7630615234375, 0.8994140625, 1.0357666015625, 1.172119140625, 1.3084716796875, 1.44482421875, 1.5811767578125, 1.717529296875, 1.8538818359375, 1.990234375, 2.1265869140625, 2.262939453125, 2.3992919921875, 2.53564453125, 2.6719970703125, 2.808349609375, 2.9447021484375, 3.0810546875, 3.2174072265625, 3.353759765625, 3.4901123046875, 3.62646484375, 3.7628173828125, 3.899169921875, 4.0355224609375, 4.171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 18.0, 24.0, 35.0, 52.0, 72.0, 128.0, 202.0, 290.0, 498.0, 827.0, 1311.0, 1945.0, 3292.0, 5429.0, 8747.0, 13987.0, 22692.0, 36774.0, 58017.0, 89471.0, 127933.0, 1047659.0, 316026.0, 125412.0, 86720.0, 56909.0, 35565.0, 21751.0, 13566.0, 8385.0, 5147.0, 3148.0, 1857.0, 1184.0, 735.0, 478.0, 281.0, 180.0, 131.0, 85.0, 57.0, 32.0, 21.0, 19.0, 16.0, 11.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.58447265625, -0.5677566528320312, -0.5510406494140625, -0.5343246459960938, -0.517608642578125, -0.5008926391601562, -0.4841766357421875, -0.46746063232421875, -0.45074462890625, -0.43402862548828125, -0.4173126220703125, -0.40059661865234375, -0.383880615234375, -0.36716461181640625, -0.3504486083984375, -0.33373260498046875, -0.3170166015625, -0.30030059814453125, -0.2835845947265625, -0.26686859130859375, -0.250152587890625, -0.23343658447265625, -0.2167205810546875, -0.20000457763671875, -0.18328857421875, -0.16657257080078125, -0.1498565673828125, -0.13314056396484375, -0.116424560546875, -0.09970855712890625, -0.0829925537109375, -0.06627655029296875, -0.049560546875, -0.03284454345703125, -0.0161285400390625, 0.00058746337890625, 0.017303466796875, 0.03401947021484375, 0.0507354736328125, 0.06745147705078125, 0.08416748046875, 0.10088348388671875, 0.1175994873046875, 0.13431549072265625, 0.151031494140625, 0.16774749755859375, 0.1844635009765625, 0.20117950439453125, 0.2178955078125, 0.23461151123046875, 0.2513275146484375, 0.26804351806640625, 0.284759521484375, 0.30147552490234375, 0.3181915283203125, 0.33490753173828125, 0.35162353515625, 0.36833953857421875, 0.3850555419921875, 0.40177154541015625, 0.418487548828125, 0.43520355224609375, 0.4519195556640625, 0.46863555908203125, 0.4853515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 16.0, 14.0, 27.0, 25.0, 36.0, 47.0, 54.0, 63.0, 60.0, 65.0, 74.0, 78.0, 80.0, 44.0, 53.0, 41.0, 47.0, 39.0, 22.0, 18.0, 13.0, 24.0, 11.0, 2.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037250518798828125, -0.0035968124866485596, -0.0034685730934143066, -0.0033403337001800537, -0.0032120943069458008, -0.003083854913711548, -0.002955615520477295, -0.002827376127243042, -0.002699136734008789, -0.002570897340774536, -0.002442657947540283, -0.0023144185543060303, -0.0021861791610717773, -0.0020579397678375244, -0.0019297003746032715, -0.0018014609813690186, -0.0016732215881347656, -0.0015449821949005127, -0.0014167428016662598, -0.0012885034084320068, -0.001160264015197754, -0.001032024621963501, -0.000903785228729248, -0.0007755458354949951, -0.0006473064422607422, -0.0005190670490264893, -0.00039082765579223633, -0.0002625882625579834, -0.00013434886932373047, -6.109476089477539e-06, 0.0001221299171447754, 0.0002503693103790283, 0.00037860870361328125, 0.0005068480968475342, 0.0006350874900817871, 0.00076332688331604, 0.000891566276550293, 0.001019805669784546, 0.0011480450630187988, 0.0012762844562530518, 0.0014045238494873047, 0.0015327632427215576, 0.0016610026359558105, 0.0017892420291900635, 0.0019174814224243164, 0.0020457208156585693, 0.0021739602088928223, 0.002302199602127075, 0.002430438995361328, 0.002558678388595581, 0.002686917781829834, 0.002815157175064087, 0.00294339656829834, 0.0030716359615325928, 0.0031998753547668457, 0.0033281147480010986, 0.0034563541412353516, 0.0035845935344696045, 0.0037128329277038574, 0.0038410723209381104, 0.003969311714172363, 0.004097551107406616, 0.004225790500640869, 0.004354029893875122, 0.004482269287109375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 7.0, 18.0, 25.0, 36.0, 25.0, 56.0, 76.0, 115.0, 183.0, 351.0, 3169.0, 955740.0, 87006.0, 978.0, 267.0, 156.0, 108.0, 69.0, 45.0, 31.0, 30.0, 16.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.1115407943725586, -0.10833549499511719, -0.10513019561767578, -0.10192489624023438, -0.09871959686279297, -0.09551429748535156, -0.09230899810791016, -0.08910369873046875, -0.08589839935302734, -0.08269309997558594, -0.07948780059814453, -0.07628250122070312, -0.07307720184326172, -0.06987190246582031, -0.0666666030883789, -0.0634613037109375, -0.060256004333496094, -0.05705070495605469, -0.05384540557861328, -0.050640106201171875, -0.04743480682373047, -0.04422950744628906, -0.041024208068847656, -0.03781890869140625, -0.034613609313964844, -0.03140830993652344, -0.02820301055908203, -0.024997711181640625, -0.02179241180419922, -0.018587112426757812, -0.015381813049316406, -0.012176513671875, -0.008971214294433594, -0.0057659149169921875, -0.0025606155395507812, 0.000644683837890625, 0.0038499832153320312, 0.0070552825927734375, 0.010260581970214844, 0.01346588134765625, 0.016671180725097656, 0.019876480102539062, 0.02308177947998047, 0.026287078857421875, 0.02949237823486328, 0.03269767761230469, 0.035902976989746094, 0.0391082763671875, 0.042313575744628906, 0.04551887512207031, 0.04872417449951172, 0.051929473876953125, 0.05513477325439453, 0.05834007263183594, 0.061545372009277344, 0.06475067138671875, 0.06795597076416016, 0.07116127014160156, 0.07436656951904297, 0.07757186889648438, 0.08077716827392578, 0.08398246765136719, 0.0871877670288086, 0.09039306640625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 180.0, 805.0, 29.0, 4.0], "bins": [-0.06408385932445526, -0.06303854286670685, -0.061993226408958435, -0.06094790995121002, -0.05990259349346161, -0.058857280761003494, -0.05781196430325508, -0.05676664784550667, -0.055721331387758255, -0.05467601493000984, -0.05363069847226143, -0.052585382014513016, -0.0515400692820549, -0.05049475282430649, -0.049449436366558075, -0.04840411990880966, -0.04735880345106125, -0.046313486993312836, -0.04526817053556442, -0.04422285407781601, -0.043177537620067596, -0.04213222488760948, -0.04108690842986107, -0.040041591972112656, -0.03899627551436424, -0.03795095905661583, -0.036905642598867416, -0.035860326141119, -0.03481501340866089, -0.033769696950912476, -0.03272438049316406, -0.03167906403541565, -0.030633747577667236, -0.029588431119918823, -0.02854311466217041, -0.027497800067067146, -0.026452483609318733, -0.02540716715157032, -0.024361852556467056, -0.023316536098718643, -0.02227121964097023, -0.021225903183221817, -0.020180586725473404, -0.01913527213037014, -0.018089955672621727, -0.017044639214873314, -0.01599932461977005, -0.014954008162021637, -0.01390869077295065, -0.01286337524652481, -0.011818058788776398, -0.010772742331027985, -0.009727426804602146, -0.008682111278176308, -0.007636794820427895, -0.006591478828340769, -0.005546162836253643, -0.004500846844166517, -0.0034555308520793915, -0.0024102148599922657, -0.00136489886790514, -0.00031958287581801414, 0.0007257331162691116, 0.0017710491083562374, 0.0028163648676127195]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 14.0, 16.0, 10.0, 20.0, 23.0, 30.0, 30.0, 40.0, 43.0, 39.0, 46.0, 52.0, 52.0, 73.0, 50.0, 55.0, 41.0, 35.0, 49.0, 40.0, 40.0, 31.0, 35.0, 22.0, 18.0, 14.0, 11.0, 13.0, 12.0, 3.0, 4.0, 8.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001860976219177246, -0.0017893752083182335, -0.0017177741974592209, -0.0016461731866002083, -0.0015745721757411957, -0.001502971164882183, -0.0014313701540231705, -0.0013597691431641579, -0.0012881681323051453, -0.0012165671214461327, -0.00114496611058712, -0.0010733650997281075, -0.0010017640888690948, -0.0009301630780100822, -0.0008585620671510696, -0.000786961056292057, -0.0007153600454330444, -0.0006437590345740318, -0.0005721580237150192, -0.0005005570128560066, -0.000428956001996994, -0.0003573549911379814, -0.0002857539802789688, -0.0002141529694199562, -0.0001425519585609436, -7.0950947701931e-05, 6.50063157081604e-07, 7.225107401609421e-05, 0.0001438520848751068, 0.00021545309573411942, 0.000287054106593132, 0.0003586551174521446, 0.0004302561283111572, 0.0005018571391701698, 0.0005734581500291824, 0.000645059160888195, 0.0007166601717472076, 0.0007882611826062202, 0.0008598621934652328, 0.0009314632043242455, 0.001003064215183258, 0.0010746652260422707, 0.0011462662369012833, 0.0012178672477602959, 0.0012894682586193085, 0.001361069269478321, 0.0014326702803373337, 0.0015042712911963463, 0.0015758723020553589, 0.0016474733129143715, 0.001719074323773384, 0.0017906753346323967, 0.0018622763454914093, 0.001933877356350422, 0.0020054783672094345, 0.002077079378068447, 0.0021486803889274597, 0.0022202813997864723, 0.002291882410645485, 0.0023634834215044975, 0.00243508443236351, 0.0025066854432225227, 0.0025782864540815353, 0.002649887464940548, 0.0027214884757995605]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 41.0, 45.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 10.0, 17.0, 23.0, 35.0, 31.0, 61.0, 107.0, 158.0, 281.0, 513.0, 916.0, 1770.0, 3797.0, 7901.0, 17252.0, 39542.0, 98640.0, 309182.0, 369647.0, 115727.0, 45733.0, 19661.0, 8954.0, 4176.0, 2034.0, 986.0, 553.0, 294.0, 182.0, 110.0, 67.0, 44.0, 37.0, 12.0, 15.0, 15.0, 15.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05859375, -5.857177734375, -5.65576171875, -5.454345703125, -5.2529296875, -5.051513671875, -4.85009765625, -4.648681640625, -4.447265625, -4.245849609375, -4.04443359375, -3.843017578125, -3.6416015625, -3.440185546875, -3.23876953125, -3.037353515625, -2.8359375, -2.634521484375, -2.43310546875, -2.231689453125, -2.0302734375, -1.828857421875, -1.62744140625, -1.426025390625, -1.224609375, -1.023193359375, -0.82177734375, -0.620361328125, -0.4189453125, -0.217529296875, -0.01611328125, 0.185302734375, 0.38671875, 0.588134765625, 0.78955078125, 0.990966796875, 1.1923828125, 1.393798828125, 1.59521484375, 1.796630859375, 1.998046875, 2.199462890625, 2.40087890625, 2.602294921875, 2.8037109375, 3.005126953125, 3.20654296875, 3.407958984375, 3.609375, 3.810791015625, 4.01220703125, 4.213623046875, 4.4150390625, 4.616455078125, 4.81787109375, 5.019287109375, 5.220703125, 5.422119140625, 5.62353515625, 5.824951171875, 6.0263671875, 6.227783203125, 6.42919921875, 6.630615234375, 6.83203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 4.0, 13.0, 17.0, 22.0, 18.0, 23.0, 24.0, 30.0, 27.0, 33.0, 39.0, 40.0, 47.0, 50.0, 75.0, 246.0, 1605.0, 190.0, 83.0, 53.0, 43.0, 47.0, 44.0, 39.0, 28.0, 33.0, 26.0, 20.0, 23.0, 18.0, 14.0, 6.0, 16.0, 6.0, 8.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-23.078125, -22.40673828125, -21.7353515625, -21.06396484375, -20.392578125, -19.72119140625, -19.0498046875, -18.37841796875, -17.70703125, -17.03564453125, -16.3642578125, -15.69287109375, -15.021484375, -14.35009765625, -13.6787109375, -13.00732421875, -12.3359375, -11.66455078125, -10.9931640625, -10.32177734375, -9.650390625, -8.97900390625, -8.3076171875, -7.63623046875, -6.96484375, -6.29345703125, -5.6220703125, -4.95068359375, -4.279296875, -3.60791015625, -2.9365234375, -2.26513671875, -1.59375, -0.92236328125, -0.2509765625, 0.42041015625, 1.091796875, 1.76318359375, 2.4345703125, 3.10595703125, 3.77734375, 4.44873046875, 5.1201171875, 5.79150390625, 6.462890625, 7.13427734375, 7.8056640625, 8.47705078125, 9.1484375, 9.81982421875, 10.4912109375, 11.16259765625, 11.833984375, 12.50537109375, 13.1767578125, 13.84814453125, 14.51953125, 15.19091796875, 15.8623046875, 16.53369140625, 17.205078125, 17.87646484375, 18.5478515625, 19.21923828125, 19.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 12.0, 11.0, 9.0, 10.0, 14.0, 15.0, 28.0, 27.0, 28.0, 48.0, 46.0, 88.0, 87.0, 145.0, 170.0, 193.0, 348.0, 631.0, 2735.0, 78505.0, 3007643.0, 50891.0, 2279.0, 578.0, 311.0, 201.0, 149.0, 124.0, 63.0, 62.0, 53.0, 40.0, 31.0, 29.0, 28.0, 12.0, 7.0, 10.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.0, -31.87939453125, -30.7587890625, -29.63818359375, -28.517578125, -27.39697265625, -26.2763671875, -25.15576171875, -24.03515625, -22.91455078125, -21.7939453125, -20.67333984375, -19.552734375, -18.43212890625, -17.3115234375, -16.19091796875, -15.0703125, -13.94970703125, -12.8291015625, -11.70849609375, -10.587890625, -9.46728515625, -8.3466796875, -7.22607421875, -6.10546875, -4.98486328125, -3.8642578125, -2.74365234375, -1.623046875, -0.50244140625, 0.6181640625, 1.73876953125, 2.859375, 3.97998046875, 5.1005859375, 6.22119140625, 7.341796875, 8.46240234375, 9.5830078125, 10.70361328125, 11.82421875, 12.94482421875, 14.0654296875, 15.18603515625, 16.306640625, 17.42724609375, 18.5478515625, 19.66845703125, 20.7890625, 21.90966796875, 23.0302734375, 24.15087890625, 25.271484375, 26.39208984375, 27.5126953125, 28.63330078125, 29.75390625, 30.87451171875, 31.9951171875, 33.11572265625, 34.236328125, 35.35693359375, 36.4775390625, 37.59814453125, 38.71875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 171.0, 722.0, 119.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.3849792480469, -263.5423583984375, -258.6997375488281, -253.8571014404297, -249.01446533203125, -244.17184448242188, -239.32920837402344, -234.48658752441406, -229.64395141601562, -224.80133056640625, -219.9586944580078, -215.11607360839844, -210.2734375, -205.43081665039062, -200.5881805419922, -195.7455596923828, -190.90293884277344, -186.06031799316406, -181.21768188476562, -176.37506103515625, -171.5324249267578, -166.68980407714844, -161.84716796875, -157.00454711914062, -152.16192626953125, -147.31930541992188, -142.47666931152344, -137.63404846191406, -132.79141235351562, -127.94879150390625, -123.10616302490234, -118.26353454589844, -113.42090606689453, -108.57827758789062, -103.73564910888672, -98.89302062988281, -94.05039978027344, -89.207763671875, -84.36514282226562, -79.52251434326172, -74.67988586425781, -69.8372573852539, -64.99462890625, -60.15200424194336, -55.30937576293945, -50.46674728393555, -45.624122619628906, -40.781494140625, -35.938865661621094, -31.096237182617188, -26.253610610961914, -21.41098403930664, -16.568355560302734, -11.725727081298828, -6.883100509643555, -2.0404739379882812, 2.802154541015625, 7.644782066345215, 12.487409591674805, 17.330036163330078, 22.172664642333984, 27.01529312133789, 31.857919692993164, 36.70054626464844, 41.543174743652344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 10.0, 10.0, 11.0, 5.0, 11.0, 12.0, 19.0, 21.0, 16.0, 18.0, 25.0, 29.0, 37.0, 20.0, 35.0, 33.0, 33.0, 34.0, 48.0, 36.0, 41.0, 43.0, 33.0, 36.0, 41.0, 38.0, 30.0, 34.0, 22.0, 21.0, 32.0, 22.0, 13.0, 22.0, 14.0, 14.0, 10.0, 12.0, 11.0, 14.0, 15.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.861915588378906, -49.33371353149414, -47.80550765991211, -46.277305603027344, -44.74910354614258, -43.22089767456055, -41.69269561767578, -40.16448974609375, -38.636287689208984, -37.10808563232422, -35.57987976074219, -34.05167770385742, -32.523475646972656, -30.995269775390625, -29.46706771850586, -27.93886375427246, -26.410661697387695, -24.882457733154297, -23.35425567626953, -21.826051712036133, -20.297847747802734, -18.76964569091797, -17.24144172668457, -15.713237762451172, -14.18503475189209, -12.656831741333008, -11.12862777709961, -9.600424766540527, -8.072221755981445, -6.544017791748047, -5.015814781188965, -3.4876108169555664, -1.9594078063964844, -0.4312044382095337, 1.096998929977417, 2.625202178955078, 4.153405666351318, 5.681609153747559, 7.209812164306641, 8.738016128540039, 10.266219139099121, 11.794422149658203, 13.322626113891602, 14.850829124450684, 16.379032135009766, 17.907236099243164, 19.435440063476562, 20.963642120361328, 22.491846084594727, 24.020050048828125, 25.54825210571289, 27.07645606994629, 28.604660034179688, 30.132862091064453, 31.66106605529785, 33.18927001953125, 34.717472076416016, 36.24567413330078, 37.77388000488281, 39.30208206176758, 40.830284118652344, 42.358489990234375, 43.88669204711914, 45.414894104003906, 46.94309997558594]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 9.0, 3.0, 9.0, 5.0, 9.0, 18.0, 8.0, 17.0, 25.0, 24.0, 22.0, 23.0, 30.0, 30.0, 45.0, 36.0, 35.0, 52.0, 41.0, 47.0, 45.0, 50.0, 34.0, 40.0, 39.0, 31.0, 33.0, 29.0, 25.0, 34.0, 16.0, 17.0, 15.0, 15.0, 11.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.47265625, -6.2568359375, -6.041015625, -5.8251953125, -5.609375, -5.3935546875, -5.177734375, -4.9619140625, -4.74609375, -4.5302734375, -4.314453125, -4.0986328125, -3.8828125, -3.6669921875, -3.451171875, -3.2353515625, -3.01953125, -2.8037109375, -2.587890625, -2.3720703125, -2.15625, -1.9404296875, -1.724609375, -1.5087890625, -1.29296875, -1.0771484375, -0.861328125, -0.6455078125, -0.4296875, -0.2138671875, 0.001953125, 0.2177734375, 0.43359375, 0.6494140625, 0.865234375, 1.0810546875, 1.296875, 1.5126953125, 1.728515625, 1.9443359375, 2.16015625, 2.3759765625, 2.591796875, 2.8076171875, 3.0234375, 3.2392578125, 3.455078125, 3.6708984375, 3.88671875, 4.1025390625, 4.318359375, 4.5341796875, 4.75, 4.9658203125, 5.181640625, 5.3974609375, 5.61328125, 5.8291015625, 6.044921875, 6.2607421875, 6.4765625, 6.6923828125, 6.908203125, 7.1240234375, 7.33984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 7.0, 15.0, 15.0, 21.0, 24.0, 18.0, 35.0, 41.0, 47.0, 79.0, 129.0, 274.0, 619.0, 1559.0, 6461.0, 37763.0, 524763.0, 3077826.0, 499595.0, 35799.0, 6166.0, 1636.0, 615.0, 252.0, 138.0, 91.0, 38.0, 36.0, 44.0, 27.0, 24.0, 18.0, 18.0, 11.0, 8.0, 10.0, 2.0, 7.0, 4.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.133056640625, -16.53173828125, -15.930419921875, -15.3291015625, -14.727783203125, -14.12646484375, -13.525146484375, -12.923828125, -12.322509765625, -11.72119140625, -11.119873046875, -10.5185546875, -9.917236328125, -9.31591796875, -8.714599609375, -8.11328125, -7.511962890625, -6.91064453125, -6.309326171875, -5.7080078125, -5.106689453125, -4.50537109375, -3.904052734375, -3.302734375, -2.701416015625, -2.10009765625, -1.498779296875, -0.8974609375, -0.296142578125, 0.30517578125, 0.906494140625, 1.5078125, 2.109130859375, 2.71044921875, 3.311767578125, 3.9130859375, 4.514404296875, 5.11572265625, 5.717041015625, 6.318359375, 6.919677734375, 7.52099609375, 8.122314453125, 8.7236328125, 9.324951171875, 9.92626953125, 10.527587890625, 11.12890625, 11.730224609375, 12.33154296875, 12.932861328125, 13.5341796875, 14.135498046875, 14.73681640625, 15.338134765625, 15.939453125, 16.540771484375, 17.14208984375, 17.743408203125, 18.3447265625, 18.946044921875, 19.54736328125, 20.148681640625, 20.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 10.0, 13.0, 18.0, 23.0, 24.0, 31.0, 47.0, 67.0, 78.0, 88.0, 122.0, 163.0, 206.0, 272.0, 287.0, 380.0, 397.0, 346.0, 339.0, 269.0, 180.0, 138.0, 114.0, 76.0, 67.0, 69.0, 44.0, 42.0, 29.0, 28.0, 19.0, 15.0, 7.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5361328125, -9.212890625, -8.8896484375, -8.56640625, -8.2431640625, -7.919921875, -7.5966796875, -7.2734375, -6.9501953125, -6.626953125, -6.3037109375, -5.98046875, -5.6572265625, -5.333984375, -5.0107421875, -4.6875, -4.3642578125, -4.041015625, -3.7177734375, -3.39453125, -3.0712890625, -2.748046875, -2.4248046875, -2.1015625, -1.7783203125, -1.455078125, -1.1318359375, -0.80859375, -0.4853515625, -0.162109375, 0.1611328125, 0.484375, 0.8076171875, 1.130859375, 1.4541015625, 1.77734375, 2.1005859375, 2.423828125, 2.7470703125, 3.0703125, 3.3935546875, 3.716796875, 4.0400390625, 4.36328125, 4.6865234375, 5.009765625, 5.3330078125, 5.65625, 5.9794921875, 6.302734375, 6.6259765625, 6.94921875, 7.2724609375, 7.595703125, 7.9189453125, 8.2421875, 8.5654296875, 8.888671875, 9.2119140625, 9.53515625, 9.8583984375, 10.181640625, 10.5048828125, 10.828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 11.0, 15.0, 14.0, 38.0, 44.0, 70.0, 79.0, 105.0, 143.0, 176.0, 265.0, 354.0, 1115.0, 13381.0, 2391994.0, 1772393.0, 11662.0, 983.0, 379.0, 296.0, 178.0, 147.0, 105.0, 75.0, 64.0, 53.0, 34.0, 22.0, 17.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.75, -61.005859375, -59.26171875, -57.517578125, -55.7734375, -54.029296875, -52.28515625, -50.541015625, -48.796875, -47.052734375, -45.30859375, -43.564453125, -41.8203125, -40.076171875, -38.33203125, -36.587890625, -34.84375, -33.099609375, -31.35546875, -29.611328125, -27.8671875, -26.123046875, -24.37890625, -22.634765625, -20.890625, -19.146484375, -17.40234375, -15.658203125, -13.9140625, -12.169921875, -10.42578125, -8.681640625, -6.9375, -5.193359375, -3.44921875, -1.705078125, 0.0390625, 1.783203125, 3.52734375, 5.271484375, 7.015625, 8.759765625, 10.50390625, 12.248046875, 13.9921875, 15.736328125, 17.48046875, 19.224609375, 20.96875, 22.712890625, 24.45703125, 26.201171875, 27.9453125, 29.689453125, 31.43359375, 33.177734375, 34.921875, 36.666015625, 38.41015625, 40.154296875, 41.8984375, 43.642578125, 45.38671875, 47.130859375, 48.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 210.0, 500.0, 243.0, 37.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-323.2208557128906, -316.421630859375, -309.6224060058594, -302.82318115234375, -296.02398681640625, -289.2247619628906, -282.425537109375, -275.6263122558594, -268.82708740234375, -262.0278625488281, -255.22865295410156, -248.42942810058594, -241.6302032470703, -234.83099365234375, -228.03176879882812, -221.2325439453125, -214.433349609375, -207.63412475585938, -200.8349151611328, -194.0356903076172, -187.23646545410156, -180.437255859375, -173.63803100585938, -166.83880615234375, -160.03958129882812, -153.2403564453125, -146.44114685058594, -139.6419219970703, -132.8426971435547, -126.04348754882812, -119.2442626953125, -112.4450454711914, -105.64582061767578, -98.84660339355469, -92.04737854003906, -85.24816131591797, -78.44894409179688, -71.64971923828125, -64.85050201416016, -58.05128479003906, -51.2520637512207, -44.452842712402344, -37.65362548828125, -30.85440444946289, -24.055185317993164, -17.255966186523438, -10.456745147705078, -3.6575279235839844, 3.141693115234375, 9.940912246704102, 16.740131378173828, 23.539352416992188, 30.338571548461914, 37.13779067993164, 43.93701171875, 50.736228942871094, 57.53544998168945, 64.33467102050781, 71.1338882446289, 77.93310546875, 84.73233032226562, 91.53154754638672, 98.33076477050781, 105.12998962402344, 111.92920684814453]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 7.0, 15.0, 14.0, 11.0, 21.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 31.0, 39.0, 26.0, 33.0, 33.0, 32.0, 45.0, 37.0, 54.0, 38.0, 48.0, 35.0, 21.0, 31.0, 37.0, 28.0, 29.0, 20.0, 25.0, 20.0, 17.0, 20.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.93975830078125, -38.61375427246094, -37.287750244140625, -35.96174621582031, -34.6357421875, -33.30973434448242, -31.98373031616211, -30.657726287841797, -29.331722259521484, -28.005718231201172, -26.67971420288086, -25.353708267211914, -24.0277042388916, -22.70170021057129, -21.375694274902344, -20.04969024658203, -18.72368621826172, -17.397682189941406, -16.071678161621094, -14.745672225952148, -13.419668197631836, -12.093664169311523, -10.767659187316895, -9.441654205322266, -8.115650177001953, -6.789645671844482, -5.463641166687012, -4.137636661529541, -2.8116321563720703, -1.4856276512145996, -0.1596231460571289, 1.1663818359375, 2.4923858642578125, 3.818390369415283, 5.144394874572754, 6.470399379730225, 7.796403884887695, 9.122407913208008, 10.448412895202637, 11.774417877197266, 13.100421905517578, 14.42642593383789, 15.75243091583252, 17.07843589782715, 18.40443992614746, 19.730443954467773, 21.05644989013672, 22.38245391845703, 23.708457946777344, 25.034461975097656, 26.36046600341797, 27.686471939086914, 29.012475967407227, 30.33847999572754, 31.664485931396484, 32.9904899597168, 34.31649398803711, 35.64249801635742, 36.968502044677734, 38.29450607299805, 39.620513916015625, 40.94651794433594, 42.27252197265625, 43.59852600097656, 44.924530029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 42.0, 37.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 7.0, 19.0, 20.0, 29.0, 47.0, 75.0, 97.0, 160.0, 221.0, 346.0, 565.0, 846.0, 1405.0, 2005.0, 3142.0, 4988.0, 7669.0, 11979.0, 18687.0, 29086.0, 45537.0, 71464.0, 109937.0, 154187.0, 173919.0, 141053.0, 97030.0, 62404.0, 40440.0, 25604.0, 16204.0, 10365.0, 6839.0, 4295.0, 2744.0, 1812.0, 1166.0, 739.0, 496.0, 315.0, 197.0, 147.0, 89.0, 64.0, 30.0, 28.0, 13.0, 16.0, 5.0, 9.0, 6.0, 8.0], "bins": [-0.76904296875, -0.7478866577148438, -0.7267303466796875, -0.7055740356445312, -0.684417724609375, -0.6632614135742188, -0.6421051025390625, -0.6209487915039062, -0.59979248046875, -0.5786361694335938, -0.5574798583984375, -0.5363235473632812, -0.515167236328125, -0.49401092529296875, -0.4728546142578125, -0.45169830322265625, -0.4305419921875, -0.40938568115234375, -0.3882293701171875, -0.36707305908203125, -0.345916748046875, -0.32476043701171875, -0.3036041259765625, -0.28244781494140625, -0.26129150390625, -0.24013519287109375, -0.2189788818359375, -0.19782257080078125, -0.176666259765625, -0.15550994873046875, -0.1343536376953125, -0.11319732666015625, -0.092041015625, -0.07088470458984375, -0.0497283935546875, -0.02857208251953125, -0.007415771484375, 0.01374053955078125, 0.0348968505859375, 0.05605316162109375, 0.07720947265625, 0.09836578369140625, 0.1195220947265625, 0.14067840576171875, 0.161834716796875, 0.18299102783203125, 0.2041473388671875, 0.22530364990234375, 0.2464599609375, 0.26761627197265625, 0.2887725830078125, 0.30992889404296875, 0.331085205078125, 0.35224151611328125, 0.3733978271484375, 0.39455413818359375, 0.41571044921875, 0.43686676025390625, 0.4580230712890625, 0.47917938232421875, 0.500335693359375, 0.5214920043945312, 0.5426483154296875, 0.5638046264648438, 0.5849609375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 3.0, 10.0, 6.0, 8.0, 11.0, 12.0, 17.0, 17.0, 26.0, 26.0, 20.0, 39.0, 31.0, 37.0, 36.0, 46.0, 37.0, 43.0, 34.0, 41.0, 1064.0, 47.0, 42.0, 39.0, 45.0, 34.0, 30.0, 30.0, 30.0, 21.0, 12.0, 23.0, 15.0, 19.0, 14.0, 16.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.864013671875, -4.71240234375, -4.560791015625, -4.4091796875, -4.257568359375, -4.10595703125, -3.954345703125, -3.802734375, -3.651123046875, -3.49951171875, -3.347900390625, -3.1962890625, -3.044677734375, -2.89306640625, -2.741455078125, -2.58984375, -2.438232421875, -2.28662109375, -2.135009765625, -1.9833984375, -1.831787109375, -1.68017578125, -1.528564453125, -1.376953125, -1.225341796875, -1.07373046875, -0.922119140625, -0.7705078125, -0.618896484375, -0.46728515625, -0.315673828125, -0.1640625, -0.012451171875, 0.13916015625, 0.290771484375, 0.4423828125, 0.593994140625, 0.74560546875, 0.897216796875, 1.048828125, 1.200439453125, 1.35205078125, 1.503662109375, 1.6552734375, 1.806884765625, 1.95849609375, 2.110107421875, 2.26171875, 2.413330078125, 2.56494140625, 2.716552734375, 2.8681640625, 3.019775390625, 3.17138671875, 3.322998046875, 3.474609375, 3.626220703125, 3.77783203125, 3.929443359375, 4.0810546875, 4.232666015625, 4.38427734375, 4.535888671875, 4.6875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 16.0, 36.0, 44.0, 78.0, 128.0, 196.0, 337.0, 638.0, 1046.0, 1929.0, 3436.0, 5730.0, 9936.0, 16706.0, 29097.0, 48792.0, 80270.0, 126686.0, 184959.0, 1219194.0, 140062.0, 92006.0, 56130.0, 33060.0, 19352.0, 11491.0, 6638.0, 3877.0, 2155.0, 1279.0, 766.0, 448.0, 214.0, 164.0, 94.0, 54.0, 31.0, 21.0, 9.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5530929565429688, -0.5334320068359375, -0.5137710571289062, -0.494110107421875, -0.47444915771484375, -0.4547882080078125, -0.43512725830078125, -0.41546630859375, -0.39580535888671875, -0.3761444091796875, -0.35648345947265625, -0.336822509765625, -0.31716156005859375, -0.2975006103515625, -0.27783966064453125, -0.2581787109375, -0.23851776123046875, -0.2188568115234375, -0.19919586181640625, -0.179534912109375, -0.15987396240234375, -0.1402130126953125, -0.12055206298828125, -0.10089111328125, -0.08123016357421875, -0.0615692138671875, -0.04190826416015625, -0.022247314453125, -0.00258636474609375, 0.0170745849609375, 0.03673553466796875, 0.056396484375, 0.07605743408203125, 0.0957183837890625, 0.11537933349609375, 0.135040283203125, 0.15470123291015625, 0.1743621826171875, 0.19402313232421875, 0.21368408203125, 0.23334503173828125, 0.2530059814453125, 0.27266693115234375, 0.292327880859375, 0.31198883056640625, 0.3316497802734375, 0.35131072998046875, 0.3709716796875, 0.39063262939453125, 0.4102935791015625, 0.42995452880859375, 0.449615478515625, 0.46927642822265625, 0.4889373779296875, 0.5085983276367188, 0.52825927734375, 0.5479202270507812, 0.5675811767578125, 0.5872421264648438, 0.606903076171875, 0.6265640258789062, 0.6462249755859375, 0.6658859252929688, 0.685546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 20.0, 18.0, 24.0, 23.0, 43.0, 47.0, 66.0, 61.0, 60.0, 85.0, 109.0, 88.0, 61.0, 71.0, 40.0, 31.0, 29.0, 33.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0063018798828125, -0.006111621856689453, -0.005921363830566406, -0.005731105804443359, -0.0055408477783203125, -0.005350589752197266, -0.005160331726074219, -0.004970073699951172, -0.004779815673828125, -0.004589557647705078, -0.004399299621582031, -0.004209041595458984, -0.0040187835693359375, -0.0038285255432128906, -0.0036382675170898438, -0.003448009490966797, -0.00325775146484375, -0.003067493438720703, -0.0028772354125976562, -0.0026869773864746094, -0.0024967193603515625, -0.0023064613342285156, -0.0021162033081054688, -0.0019259452819824219, -0.001735687255859375, -0.0015454292297363281, -0.0013551712036132812, -0.0011649131774902344, -0.0009746551513671875, -0.0007843971252441406, -0.0005941390991210938, -0.0004038810729980469, -0.000213623046875, -2.3365020751953125e-05, 0.00016689300537109375, 0.0003571510314941406, 0.0005474090576171875, 0.0007376670837402344, 0.0009279251098632812, 0.0011181831359863281, 0.001308441162109375, 0.0014986991882324219, 0.0016889572143554688, 0.0018792152404785156, 0.0020694732666015625, 0.0022597312927246094, 0.0024499893188476562, 0.002640247344970703, 0.00283050537109375, 0.003020763397216797, 0.0032110214233398438, 0.0034012794494628906, 0.0035915374755859375, 0.0037817955017089844, 0.003972053527832031, 0.004162311553955078, 0.004352569580078125, 0.004542827606201172, 0.004733085632324219, 0.004923343658447266, 0.0051136016845703125, 0.005303859710693359, 0.005494117736816406, 0.005684375762939453, 0.0058746337890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 3.0, 12.0, 13.0, 16.0, 28.0, 46.0, 56.0, 60.0, 89.0, 178.0, 323.0, 939.0, 416175.0, 628706.0, 983.0, 339.0, 164.0, 120.0, 83.0, 59.0, 38.0, 23.0, 24.0, 14.0, 10.0, 5.0, 4.0, 4.0, 7.0, 6.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1258544921875, -0.12179756164550781, -0.11774063110351562, -0.11368370056152344, -0.10962677001953125, -0.10556983947753906, -0.10151290893554688, -0.09745597839355469, -0.0933990478515625, -0.08934211730957031, -0.08528518676757812, -0.08122825622558594, -0.07717132568359375, -0.07311439514160156, -0.06905746459960938, -0.06500053405761719, -0.060943603515625, -0.05688667297363281, -0.052829742431640625, -0.04877281188964844, -0.04471588134765625, -0.04065895080566406, -0.036602020263671875, -0.03254508972167969, -0.0284881591796875, -0.024431228637695312, -0.020374298095703125, -0.016317367553710938, -0.01226043701171875, -0.008203506469726562, -0.004146575927734375, -8.96453857421875e-05, 0.00396728515625, 0.008024215698242188, 0.012081146240234375, 0.016138076782226562, 0.02019500732421875, 0.024251937866210938, 0.028308868408203125, 0.03236579895019531, 0.0364227294921875, 0.04047966003417969, 0.044536590576171875, 0.04859352111816406, 0.05265045166015625, 0.05670738220214844, 0.060764312744140625, 0.06482124328613281, 0.068878173828125, 0.07293510437011719, 0.07699203491210938, 0.08104896545410156, 0.08510589599609375, 0.08916282653808594, 0.09321975708007812, 0.09727668762207031, 0.1013336181640625, 0.10539054870605469, 0.10944747924804688, 0.11350440979003906, 0.11756134033203125, 0.12161827087402344, 0.12567520141601562, 0.1297321319580078, 0.1337890625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 31.0, 195.0, 519.0, 215.0, 39.0, 12.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.024682270362973213, -0.02424539066851139, -0.023808512836694717, -0.023371633142232895, -0.022934753447771072, -0.02249787375330925, -0.022060995921492577, -0.021624116227030754, -0.02118723839521408, -0.02075035870075226, -0.020313480868935585, -0.019876601174473763, -0.01943972148001194, -0.019002843648195267, -0.018565963953733444, -0.01812908425927162, -0.0176922045648098, -0.017255324870347977, -0.016818447038531303, -0.01638156734406948, -0.01594468764960766, -0.01550780888646841, -0.015070930123329163, -0.01463405042886734, -0.014197171665728092, -0.013760292902588844, -0.013323413208127022, -0.012886534444987774, -0.012449655681848526, -0.012012775987386703, -0.011575897224247456, -0.011139018461108208, -0.01070213969796896, -0.010265260934829712, -0.00982838124036789, -0.009391502477228642, -0.008954623714089394, -0.008517744019627571, -0.008080865256488323, -0.007643986027687788, -0.007207106798887253, -0.006770227570086718, -0.006333348341286182, -0.0058964695781469345, -0.005459590349346399, -0.005022711120545864, -0.004585832357406616, -0.004148953128606081, -0.003712073899805546, -0.0032751946710050106, -0.002838315675035119, -0.0024014366790652275, -0.0019645574502646923, -0.001527678221464157, -0.0010907992254942656, -0.000653920229524374, -0.0002170410007238388, 0.00021983811166137457, 0.0006567172240465879, 0.0010935963364318013, 0.0015304754488170147, 0.00196735467761755, 0.0024042336735874414, 0.002841112669557333, 0.003277991898357868]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 12.0, 20.0, 21.0, 24.0, 27.0, 24.0, 32.0, 51.0, 50.0, 50.0, 53.0, 70.0, 58.0, 60.0, 55.0, 56.0, 48.0, 40.0, 43.0, 33.0, 35.0, 26.0, 16.0, 25.0, 9.0, 10.0, 13.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003043830394744873, -0.0029310202226042747, -0.0028182100504636765, -0.002705399878323078, -0.00259258970618248, -0.0024797795340418816, -0.0023669693619012833, -0.002254159189760685, -0.0021413490176200867, -0.0020285388454794884, -0.00191572867333889, -0.0018029185011982918, -0.0016901083290576935, -0.0015772981569170952, -0.0014644879847764969, -0.0013516778126358986, -0.0012388676404953003, -0.001126057468354702, -0.0010132472962141037, -0.0009004371240735054, -0.0007876269519329071, -0.0006748167797923088, -0.0005620066076517105, -0.0004491964355111122, -0.0003363862633705139, -0.00022357609122991562, -0.00011076591908931732, 2.0442530512809753e-06, 0.00011485442519187927, 0.00022766459733247757, 0.00034047476947307587, 0.00045328494161367416, 0.0005660951137542725, 0.0006789052858948708, 0.0007917154580354691, 0.0009045256301760674, 0.0010173358023166656, 0.001130145974457264, 0.0012429561465978622, 0.0013557663187384605, 0.0014685764908790588, 0.0015813866630196571, 0.0016941968351602554, 0.0018070070073008537, 0.001919817179441452, 0.0020326273515820503, 0.0021454375237226486, 0.002258247695863247, 0.002371057868003845, 0.0024838680401444435, 0.002596678212285042, 0.00270948838442564, 0.0028222985565662384, 0.0029351087287068367, 0.003047918900847435, 0.0031607290729880333, 0.0032735392451286316, 0.00338634941726923, 0.003499159589409828, 0.0036119697615504265, 0.0037247799336910248, 0.003837590105831623, 0.003950400277972221, 0.00406321045011282, 0.004176020622253418]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 43.0, 36.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 10.0, 11.0, 6.0, 11.0, 20.0, 21.0, 20.0, 17.0, 46.0, 51.0, 56.0, 78.0, 129.0, 190.0, 270.0, 510.0, 1322.0, 4434.0, 18351.0, 111371.0, 774742.0, 111073.0, 18458.0, 4495.0, 1354.0, 564.0, 299.0, 160.0, 111.0, 87.0, 66.0, 56.0, 30.0, 31.0, 21.0, 19.0, 12.0, 16.0, 10.0, 8.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-15.1796875, -14.7265625, -14.2734375, -13.8203125, -13.3671875, -12.9140625, -12.4609375, -12.0078125, -11.5546875, -11.1015625, -10.6484375, -10.1953125, -9.7421875, -9.2890625, -8.8359375, -8.3828125, -7.9296875, -7.4765625, -7.0234375, -6.5703125, -6.1171875, -5.6640625, -5.2109375, -4.7578125, -4.3046875, -3.8515625, -3.3984375, -2.9453125, -2.4921875, -2.0390625, -1.5859375, -1.1328125, -0.6796875, -0.2265625, 0.2265625, 0.6796875, 1.1328125, 1.5859375, 2.0390625, 2.4921875, 2.9453125, 3.3984375, 3.8515625, 4.3046875, 4.7578125, 5.2109375, 5.6640625, 6.1171875, 6.5703125, 7.0234375, 7.4765625, 7.9296875, 8.3828125, 8.8359375, 9.2890625, 9.7421875, 10.1953125, 10.6484375, 11.1015625, 11.5546875, 12.0078125, 12.4609375, 12.9140625, 13.3671875, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 4.0, 7.0, 5.0, 12.0, 14.0, 14.0, 18.0, 18.0, 23.0, 33.0, 30.0, 48.0, 41.0, 44.0, 53.0, 51.0, 79.0, 227.0, 1699.0, 158.0, 76.0, 64.0, 40.0, 36.0, 37.0, 35.0, 28.0, 23.0, 24.0, 25.0, 20.0, 9.0, 7.0, 13.0, 5.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.109375, -22.375244140625, -21.64111328125, -20.906982421875, -20.1728515625, -19.438720703125, -18.70458984375, -17.970458984375, -17.236328125, -16.502197265625, -15.76806640625, -15.033935546875, -14.2998046875, -13.565673828125, -12.83154296875, -12.097412109375, -11.36328125, -10.629150390625, -9.89501953125, -9.160888671875, -8.4267578125, -7.692626953125, -6.95849609375, -6.224365234375, -5.490234375, -4.756103515625, -4.02197265625, -3.287841796875, -2.5537109375, -1.819580078125, -1.08544921875, -0.351318359375, 0.3828125, 1.116943359375, 1.85107421875, 2.585205078125, 3.3193359375, 4.053466796875, 4.78759765625, 5.521728515625, 6.255859375, 6.989990234375, 7.72412109375, 8.458251953125, 9.1923828125, 9.926513671875, 10.66064453125, 11.394775390625, 12.12890625, 12.863037109375, 13.59716796875, 14.331298828125, 15.0654296875, 15.799560546875, 16.53369140625, 17.267822265625, 18.001953125, 18.736083984375, 19.47021484375, 20.204345703125, 20.9384765625, 21.672607421875, 22.40673828125, 23.140869140625, 23.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 10.0, 6.0, 8.0, 24.0, 28.0, 24.0, 53.0, 47.0, 55.0, 71.0, 120.0, 183.0, 371.0, 1139.0, 27149.0, 3096117.0, 18180.0, 1026.0, 374.0, 178.0, 133.0, 94.0, 62.0, 45.0, 36.0, 32.0, 22.0, 25.0, 15.0, 16.0, 7.0, 7.0, 7.0, 3.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -54.0625, -52.34375, -50.625, -48.90625, -47.1875, -45.46875, -43.75, -42.03125, -40.3125, -38.59375, -36.875, -35.15625, -33.4375, -31.71875, -30.0, -28.28125, -26.5625, -24.84375, -23.125, -21.40625, -19.6875, -17.96875, -16.25, -14.53125, -12.8125, -11.09375, -9.375, -7.65625, -5.9375, -4.21875, -2.5, -0.78125, 0.9375, 2.65625, 4.375, 6.09375, 7.8125, 9.53125, 11.25, 12.96875, 14.6875, 16.40625, 18.125, 19.84375, 21.5625, 23.28125, 25.0, 26.71875, 28.4375, 30.15625, 31.875, 33.59375, 35.3125, 37.03125, 38.75, 40.46875, 42.1875, 43.90625, 45.625, 47.34375, 49.0625, 50.78125, 52.5, 54.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 14.0, 24.0, 38.0, 64.0, 113.0, 136.0, 149.0, 166.0, 103.0, 83.0, 47.0, 32.0, 16.0, 9.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.8138370513916, -28.0267391204834, -27.239639282226562, -26.45254135131836, -25.665443420410156, -24.878345489501953, -24.091245651245117, -23.304147720336914, -22.517047882080078, -21.729949951171875, -20.94285011291504, -20.155752182006836, -19.368654251098633, -18.581554412841797, -17.794456481933594, -17.00735855102539, -16.220260620117188, -15.433161735534668, -14.646063804626465, -13.858964920043945, -13.071866989135742, -12.284768104553223, -11.497669219970703, -10.7105712890625, -9.92347240447998, -9.136373519897461, -8.349275588989258, -7.562176704406738, -6.775078296661377, -5.987979888916016, -5.200881004333496, -4.413782596588135, -3.6266841888427734, -2.839585781097412, -2.0524871349334717, -1.2653884887695312, -0.4782900810241699, 0.3088083267211914, 1.095907211303711, 1.8830056190490723, 2.6701040267944336, 3.457202434539795, 4.244300842285156, 5.031399726867676, 5.818498134613037, 6.605596542358398, 7.392695426940918, 8.179794311523438, 8.96689224243164, 9.75399112701416, 10.541089057922363, 11.328187942504883, 12.115285873413086, 12.902384757995605, 13.689483642578125, 14.476581573486328, 15.263680458068848, 16.050779342651367, 16.83787727355957, 17.624977111816406, 18.41207504272461, 19.199172973632812, 19.986270904541016, 20.77337074279785, 21.560468673706055]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 8.0, 8.0, 10.0, 6.0, 12.0, 14.0, 16.0, 19.0, 22.0, 21.0, 29.0, 24.0, 34.0, 25.0, 30.0, 34.0, 24.0, 34.0, 36.0, 34.0, 35.0, 27.0, 36.0, 41.0, 34.0, 29.0, 30.0, 33.0, 23.0, 27.0, 27.0, 13.0, 26.0, 18.0, 22.0, 14.0, 22.0, 15.0, 13.0, 8.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-47.50079345703125, -46.00641632080078, -44.51204299926758, -43.017669677734375, -41.523292541503906, -40.02891540527344, -38.534542083740234, -37.04016876220703, -35.54579162597656, -34.051414489746094, -32.55704116821289, -31.062665939331055, -29.56829071044922, -28.073915481567383, -26.579540252685547, -25.08516502380371, -23.590789794921875, -22.09641456604004, -20.602039337158203, -19.107664108276367, -17.61328887939453, -16.118913650512695, -14.62453842163086, -13.130163192749023, -11.635787963867188, -10.141412734985352, -8.647037506103516, -7.15266227722168, -5.658287048339844, -4.163911819458008, -2.669536590576172, -1.175161361694336, 0.3192138671875, 1.813589096069336, 3.307964324951172, 4.802339553833008, 6.296714782714844, 7.79109001159668, 9.285465240478516, 10.779840469360352, 12.274215698242188, 13.768590927124023, 15.26296615600586, 16.757341384887695, 18.25171661376953, 19.746091842651367, 21.240467071533203, 22.73484230041504, 24.229217529296875, 25.72359275817871, 27.217967987060547, 28.712343215942383, 30.20671844482422, 31.701093673706055, 33.19546890258789, 34.689842224121094, 36.18421936035156, 37.67859649658203, 39.172969818115234, 40.66734313964844, 42.161720275878906, 43.656097412109375, 45.15047073364258, 46.64484405517578, 48.13922119140625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 7.0, 8.0, 12.0, 14.0, 13.0, 21.0, 14.0, 17.0, 27.0, 19.0, 25.0, 23.0, 26.0, 28.0, 46.0, 41.0, 42.0, 45.0, 48.0, 38.0, 50.0, 37.0, 38.0, 30.0, 32.0, 31.0, 28.0, 30.0, 25.0, 26.0, 22.0, 22.0, 16.0, 19.0, 7.0, 16.0, 9.0, 5.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-7.4375, -7.214599609375, -6.99169921875, -6.768798828125, -6.5458984375, -6.322998046875, -6.10009765625, -5.877197265625, -5.654296875, -5.431396484375, -5.20849609375, -4.985595703125, -4.7626953125, -4.539794921875, -4.31689453125, -4.093994140625, -3.87109375, -3.648193359375, -3.42529296875, -3.202392578125, -2.9794921875, -2.756591796875, -2.53369140625, -2.310791015625, -2.087890625, -1.864990234375, -1.64208984375, -1.419189453125, -1.1962890625, -0.973388671875, -0.75048828125, -0.527587890625, -0.3046875, -0.081787109375, 0.14111328125, 0.364013671875, 0.5869140625, 0.809814453125, 1.03271484375, 1.255615234375, 1.478515625, 1.701416015625, 1.92431640625, 2.147216796875, 2.3701171875, 2.593017578125, 2.81591796875, 3.038818359375, 3.26171875, 3.484619140625, 3.70751953125, 3.930419921875, 4.1533203125, 4.376220703125, 4.59912109375, 4.822021484375, 5.044921875, 5.267822265625, 5.49072265625, 5.713623046875, 5.9365234375, 6.159423828125, 6.38232421875, 6.605224609375, 6.828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 7.0, 7.0, 12.0, 16.0, 15.0, 23.0, 23.0, 33.0, 60.0, 88.0, 175.0, 381.0, 860.0, 2049.0, 5765.0, 18413.0, 98842.0, 1260143.0, 2498718.0, 261025.0, 33046.0, 8837.0, 3244.0, 1261.0, 538.0, 274.0, 126.0, 66.0, 40.0, 35.0, 24.0, 29.0, 17.0, 17.0, 11.0, 6.0, 8.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.618408203125, -16.04931640625, -15.480224609375, -14.9111328125, -14.342041015625, -13.77294921875, -13.203857421875, -12.634765625, -12.065673828125, -11.49658203125, -10.927490234375, -10.3583984375, -9.789306640625, -9.22021484375, -8.651123046875, -8.08203125, -7.512939453125, -6.94384765625, -6.374755859375, -5.8056640625, -5.236572265625, -4.66748046875, -4.098388671875, -3.529296875, -2.960205078125, -2.39111328125, -1.822021484375, -1.2529296875, -0.683837890625, -0.11474609375, 0.454345703125, 1.0234375, 1.592529296875, 2.16162109375, 2.730712890625, 3.2998046875, 3.868896484375, 4.43798828125, 5.007080078125, 5.576171875, 6.145263671875, 6.71435546875, 7.283447265625, 7.8525390625, 8.421630859375, 8.99072265625, 9.559814453125, 10.12890625, 10.697998046875, 11.26708984375, 11.836181640625, 12.4052734375, 12.974365234375, 13.54345703125, 14.112548828125, 14.681640625, 15.250732421875, 15.81982421875, 16.388916015625, 16.9580078125, 17.527099609375, 18.09619140625, 18.665283203125, 19.234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 26.0, 24.0, 27.0, 28.0, 56.0, 72.0, 80.0, 108.0, 137.0, 217.0, 293.0, 365.0, 440.0, 484.0, 435.0, 323.0, 222.0, 176.0, 132.0, 101.0, 76.0, 65.0, 40.0, 26.0, 19.0, 10.0, 16.0, 11.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8671875, -11.48779296875, -11.1083984375, -10.72900390625, -10.349609375, -9.97021484375, -9.5908203125, -9.21142578125, -8.83203125, -8.45263671875, -8.0732421875, -7.69384765625, -7.314453125, -6.93505859375, -6.5556640625, -6.17626953125, -5.796875, -5.41748046875, -5.0380859375, -4.65869140625, -4.279296875, -3.89990234375, -3.5205078125, -3.14111328125, -2.76171875, -2.38232421875, -2.0029296875, -1.62353515625, -1.244140625, -0.86474609375, -0.4853515625, -0.10595703125, 0.2734375, 0.65283203125, 1.0322265625, 1.41162109375, 1.791015625, 2.17041015625, 2.5498046875, 2.92919921875, 3.30859375, 3.68798828125, 4.0673828125, 4.44677734375, 4.826171875, 5.20556640625, 5.5849609375, 5.96435546875, 6.34375, 6.72314453125, 7.1025390625, 7.48193359375, 7.861328125, 8.24072265625, 8.6201171875, 8.99951171875, 9.37890625, 9.75830078125, 10.1376953125, 10.51708984375, 10.896484375, 11.27587890625, 11.6552734375, 12.03466796875, 12.4140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 6.0, 10.0, 14.0, 20.0, 29.0, 33.0, 56.0, 57.0, 81.0, 87.0, 142.0, 219.0, 375.0, 776.0, 2893.0, 23831.0, 688139.0, 3395488.0, 73070.0, 6282.0, 1250.0, 477.0, 249.0, 173.0, 127.0, 89.0, 79.0, 49.0, 42.0, 25.0, 27.0, 19.0, 14.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-48.5, -47.23046875, -45.9609375, -44.69140625, -43.421875, -42.15234375, -40.8828125, -39.61328125, -38.34375, -37.07421875, -35.8046875, -34.53515625, -33.265625, -31.99609375, -30.7265625, -29.45703125, -28.1875, -26.91796875, -25.6484375, -24.37890625, -23.109375, -21.83984375, -20.5703125, -19.30078125, -18.03125, -16.76171875, -15.4921875, -14.22265625, -12.953125, -11.68359375, -10.4140625, -9.14453125, -7.875, -6.60546875, -5.3359375, -4.06640625, -2.796875, -1.52734375, -0.2578125, 1.01171875, 2.28125, 3.55078125, 4.8203125, 6.08984375, 7.359375, 8.62890625, 9.8984375, 11.16796875, 12.4375, 13.70703125, 14.9765625, 16.24609375, 17.515625, 18.78515625, 20.0546875, 21.32421875, 22.59375, 23.86328125, 25.1328125, 26.40234375, 27.671875, 28.94140625, 30.2109375, 31.48046875, 32.75]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 15.0, 29.0, 37.0, 75.0, 138.0, 190.0, 196.0, 134.0, 80.0, 59.0, 26.0, 8.0, 9.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.93444061279297, -103.53251647949219, -101.13058471679688, -98.7286605834961, -96.32673645019531, -93.9248046875, -91.52288055419922, -89.12095642089844, -86.71902465820312, -84.31710052490234, -81.91516876220703, -79.51324462890625, -77.11131286621094, -74.70938873291016, -72.30746459960938, -69.90553283691406, -67.50360870361328, -65.1016845703125, -62.69975280761719, -60.297828674316406, -57.89590072631836, -55.49397277832031, -53.09204864501953, -50.690120697021484, -48.28819274902344, -45.88626480102539, -43.484336853027344, -41.08241271972656, -38.680484771728516, -36.27855682373047, -33.87663269042969, -31.47470474243164, -29.072784423828125, -26.670856475830078, -24.268930435180664, -21.86700439453125, -19.465076446533203, -17.063148498535156, -14.661222457885742, -12.259296417236328, -9.857368469238281, -7.455441474914551, -5.05351448059082, -2.65158748626709, -0.24966049194335938, 2.152266502380371, 4.554193496704102, 6.956119537353516, 9.358047485351562, 11.759974479675293, 14.161901473999023, 16.563827514648438, 18.965755462646484, 21.36768341064453, 23.769609451293945, 26.17153549194336, 28.573463439941406, 30.975391387939453, 33.3773193359375, 35.77924346923828, 38.18117141723633, 40.583099365234375, 42.985023498535156, 45.3869514465332, 47.78887939453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 6.0, 20.0, 17.0, 18.0, 24.0, 16.0, 31.0, 33.0, 31.0, 32.0, 32.0, 41.0, 40.0, 42.0, 38.0, 46.0, 35.0, 40.0, 56.0, 52.0, 35.0, 42.0, 32.0, 33.0, 25.0, 16.0, 19.0, 23.0, 21.0, 13.0, 13.0, 6.0, 9.0, 7.0, 5.0, 3.0, 10.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.097259521484375, -44.75735092163086, -43.41743850708008, -42.07752990722656, -40.73761749267578, -39.397708892822266, -38.05780029296875, -36.71788787841797, -35.37797546386719, -34.03806686401367, -32.69815444946289, -31.358245849609375, -30.018333435058594, -28.678424835205078, -27.33851432800293, -25.99860382080078, -24.658695220947266, -23.318784713745117, -21.97887420654297, -20.638965606689453, -19.299053192138672, -17.959144592285156, -16.619234085083008, -15.27932357788086, -13.939413070678711, -12.599502563476562, -11.259592056274414, -9.919682502746582, -8.579771995544434, -7.239861488342285, -5.899951934814453, -4.560041427612305, -3.2201309204101562, -1.880220651626587, -0.5403103828430176, 0.7995996475219727, 2.139510154724121, 3.4794206619262695, 4.819330215454102, 6.15924072265625, 7.499151229858398, 8.839061737060547, 10.178972244262695, 11.518881797790527, 12.858792304992676, 14.198702812194824, 15.538612365722656, 16.878522872924805, 18.218433380126953, 19.5583438873291, 20.89825439453125, 22.238162994384766, 23.578075408935547, 24.917984008789062, 26.25789451599121, 27.59780502319336, 28.937715530395508, 30.277626037597656, 31.617536544799805, 32.95744705200195, 34.29735565185547, 35.63726806640625, 36.977176666259766, 38.31708526611328, 39.65699768066406]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 8.0, 15.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 33.0, 35.0, 38.0, 40.0, 39.0, 41.0, 32.0, 38.0, 34.0, 42.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 11.0, 4.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.35546875, -7.12518310546875, -6.8948974609375, -6.66461181640625, -6.434326171875, -6.20404052734375, -5.9737548828125, -5.74346923828125, -5.51318359375, -5.28289794921875, -5.0526123046875, -4.82232666015625, -4.592041015625, -4.36175537109375, -4.1314697265625, -3.90118408203125, -3.6708984375, -3.44061279296875, -3.2103271484375, -2.98004150390625, -2.749755859375, -2.51947021484375, -2.2891845703125, -2.05889892578125, -1.82861328125, -1.59832763671875, -1.3680419921875, -1.13775634765625, -0.907470703125, -0.67718505859375, -0.4468994140625, -0.21661376953125, 0.013671875, 0.24395751953125, 0.4742431640625, 0.70452880859375, 0.934814453125, 1.16510009765625, 1.3953857421875, 1.62567138671875, 1.85595703125, 2.08624267578125, 2.3165283203125, 2.54681396484375, 2.777099609375, 3.00738525390625, 3.2376708984375, 3.46795654296875, 3.6982421875, 3.92852783203125, 4.1588134765625, 4.38909912109375, 4.619384765625, 4.84967041015625, 5.0799560546875, 5.31024169921875, 5.54052734375, 5.77081298828125, 6.0010986328125, 6.23138427734375, 6.461669921875, 6.69195556640625, 6.9222412109375, 7.15252685546875, 7.3828125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 13.0, 24.0, 27.0, 43.0, 71.0, 96.0, 125.0, 216.0, 306.0, 429.0, 621.0, 903.0, 1327.0, 1927.0, 2816.0, 4178.0, 5926.0, 8857.0, 12667.0, 19026.0, 27304.0, 40205.0, 58832.0, 85279.0, 118523.0, 148898.0, 144507.0, 112765.0, 80016.0, 54784.0, 37284.0, 25655.0, 17344.0, 11671.0, 8192.0, 5649.0, 3821.0, 2566.0, 1770.0, 1236.0, 793.0, 600.0, 385.0, 273.0, 178.0, 136.0, 86.0, 68.0, 43.0, 35.0, 21.0, 14.0, 6.0, 5.0, 5.0, 4.0, 2.0], "bins": [-0.63134765625, -0.6121597290039062, -0.5929718017578125, -0.5737838745117188, -0.554595947265625, -0.5354080200195312, -0.5162200927734375, -0.49703216552734375, -0.47784423828125, -0.45865631103515625, -0.4394683837890625, -0.42028045654296875, -0.401092529296875, -0.38190460205078125, -0.3627166748046875, -0.34352874755859375, -0.3243408203125, -0.30515289306640625, -0.2859649658203125, -0.26677703857421875, -0.247589111328125, -0.22840118408203125, -0.2092132568359375, -0.19002532958984375, -0.17083740234375, -0.15164947509765625, -0.1324615478515625, -0.11327362060546875, -0.094085693359375, -0.07489776611328125, -0.0557098388671875, -0.03652191162109375, -0.017333984375, 0.00185394287109375, 0.0210418701171875, 0.04022979736328125, 0.059417724609375, 0.07860565185546875, 0.0977935791015625, 0.11698150634765625, 0.13616943359375, 0.15535736083984375, 0.1745452880859375, 0.19373321533203125, 0.212921142578125, 0.23210906982421875, 0.2512969970703125, 0.27048492431640625, 0.2896728515625, 0.30886077880859375, 0.3280487060546875, 0.34723663330078125, 0.366424560546875, 0.38561248779296875, 0.4048004150390625, 0.42398834228515625, 0.44317626953125, 0.46236419677734375, 0.4815521240234375, 0.5007400512695312, 0.519927978515625, 0.5391159057617188, 0.5583038330078125, 0.5774917602539062, 0.5966796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 16.0, 18.0, 22.0, 15.0, 25.0, 29.0, 23.0, 20.0, 29.0, 28.0, 46.0, 38.0, 45.0, 36.0, 33.0, 32.0, 1055.0, 39.0, 46.0, 46.0, 30.0, 25.0, 43.0, 26.0, 22.0, 25.0, 27.0, 21.0, 28.0, 17.0, 13.0, 15.0, 13.0, 11.0, 4.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.68878173828125, -4.5416259765625, -4.39447021484375, -4.247314453125, -4.10015869140625, -3.9530029296875, -3.80584716796875, -3.65869140625, -3.51153564453125, -3.3643798828125, -3.21722412109375, -3.070068359375, -2.92291259765625, -2.7757568359375, -2.62860107421875, -2.4814453125, -2.33428955078125, -2.1871337890625, -2.03997802734375, -1.892822265625, -1.74566650390625, -1.5985107421875, -1.45135498046875, -1.30419921875, -1.15704345703125, -1.0098876953125, -0.86273193359375, -0.715576171875, -0.56842041015625, -0.4212646484375, -0.27410888671875, -0.126953125, 0.02020263671875, 0.1673583984375, 0.31451416015625, 0.461669921875, 0.60882568359375, 0.7559814453125, 0.90313720703125, 1.05029296875, 1.19744873046875, 1.3446044921875, 1.49176025390625, 1.638916015625, 1.78607177734375, 1.9332275390625, 2.08038330078125, 2.2275390625, 2.37469482421875, 2.5218505859375, 2.66900634765625, 2.816162109375, 2.96331787109375, 3.1104736328125, 3.25762939453125, 3.40478515625, 3.55194091796875, 3.6990966796875, 3.84625244140625, 3.993408203125, 4.14056396484375, 4.2877197265625, 4.43487548828125, 4.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 12.0, 10.0, 11.0, 29.0, 43.0, 41.0, 72.0, 120.0, 193.0, 285.0, 465.0, 714.0, 1186.0, 1803.0, 2966.0, 4363.0, 6714.0, 10379.0, 16068.0, 25077.0, 38331.0, 58337.0, 86205.0, 119207.0, 317434.0, 1025026.0, 121630.0, 87719.0, 60397.0, 39616.0, 25724.0, 16723.0, 10650.0, 6950.0, 4502.0, 2854.0, 1886.0, 1204.0, 764.0, 510.0, 336.0, 212.0, 146.0, 79.0, 44.0, 34.0, 23.0, 11.0, 13.0, 6.0, 7.0, 5.0, 1.0, 2.0], "bins": [-0.59814453125, -0.5810699462890625, -0.563995361328125, -0.5469207763671875, -0.52984619140625, -0.5127716064453125, -0.495697021484375, -0.4786224365234375, -0.4615478515625, -0.4444732666015625, -0.427398681640625, -0.4103240966796875, -0.39324951171875, -0.3761749267578125, -0.359100341796875, -0.3420257568359375, -0.324951171875, -0.3078765869140625, -0.290802001953125, -0.2737274169921875, -0.25665283203125, -0.2395782470703125, -0.222503662109375, -0.2054290771484375, -0.1883544921875, -0.1712799072265625, -0.154205322265625, -0.1371307373046875, -0.12005615234375, -0.1029815673828125, -0.085906982421875, -0.0688323974609375, -0.0517578125, -0.0346832275390625, -0.017608642578125, -0.0005340576171875, 0.01654052734375, 0.0336151123046875, 0.050689697265625, 0.0677642822265625, 0.0848388671875, 0.1019134521484375, 0.118988037109375, 0.1360626220703125, 0.15313720703125, 0.1702117919921875, 0.187286376953125, 0.2043609619140625, 0.221435546875, 0.2385101318359375, 0.255584716796875, 0.2726593017578125, 0.28973388671875, 0.3068084716796875, 0.323883056640625, 0.3409576416015625, 0.3580322265625, 0.3751068115234375, 0.392181396484375, 0.4092559814453125, 0.42633056640625, 0.4434051513671875, 0.460479736328125, 0.4775543212890625, 0.49462890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 2.0, 10.0, 7.0, 14.0, 13.0, 29.0, 39.0, 39.0, 44.0, 59.0, 80.0, 101.0, 83.0, 86.0, 85.0, 80.0, 50.0, 41.0, 25.0, 28.0, 17.0, 10.0, 9.0, 6.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005615234375, -0.00545269250869751, -0.0052901506423950195, -0.005127608776092529, -0.004965066909790039, -0.004802525043487549, -0.004639983177185059, -0.004477441310882568, -0.004314899444580078, -0.004152357578277588, -0.003989815711975098, -0.0038272738456726074, -0.003664731979370117, -0.003502190113067627, -0.0033396482467651367, -0.0031771063804626465, -0.0030145645141601562, -0.002852022647857666, -0.0026894807815551758, -0.0025269389152526855, -0.0023643970489501953, -0.002201855182647705, -0.002039313316345215, -0.0018767714500427246, -0.0017142295837402344, -0.0015516877174377441, -0.001389145851135254, -0.0012266039848327637, -0.0010640621185302734, -0.0009015202522277832, -0.000738978385925293, -0.0005764365196228027, -0.0004138946533203125, -0.00025135278701782227, -8.881092071533203e-05, 7.37309455871582e-05, 0.00023627281188964844, 0.00039881467819213867, 0.0005613565444946289, 0.0007238984107971191, 0.0008864402770996094, 0.0010489821434020996, 0.0012115240097045898, 0.00137406587600708, 0.0015366077423095703, 0.0016991496086120605, 0.0018616914749145508, 0.002024233341217041, 0.0021867752075195312, 0.0023493170738220215, 0.0025118589401245117, 0.002674400806427002, 0.002836942672729492, 0.0029994845390319824, 0.0031620264053344727, 0.003324568271636963, 0.003487110137939453, 0.0036496520042419434, 0.0038121938705444336, 0.003974735736846924, 0.004137277603149414, 0.004299819469451904, 0.0044623613357543945, 0.004624903202056885, 0.004787445068359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 8.0, 10.0, 15.0, 28.0, 33.0, 50.0, 73.0, 112.0, 167.0, 338.0, 872.0, 164677.0, 879786.0, 1361.0, 372.0, 207.0, 122.0, 86.0, 59.0, 37.0, 22.0, 29.0, 9.0, 17.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09300422668457031, -0.08957290649414062, -0.08614158630371094, -0.08271026611328125, -0.07927894592285156, -0.07584762573242188, -0.07241630554199219, -0.0689849853515625, -0.06555366516113281, -0.062122344970703125, -0.05869102478027344, -0.05525970458984375, -0.05182838439941406, -0.048397064208984375, -0.04496574401855469, -0.041534423828125, -0.03810310363769531, -0.034671783447265625, -0.031240463256835938, -0.02780914306640625, -0.024377822875976562, -0.020946502685546875, -0.017515182495117188, -0.0140838623046875, -0.010652542114257812, -0.007221221923828125, -0.0037899017333984375, -0.00035858154296875, 0.0030727386474609375, 0.006504058837890625, 0.009935379028320312, 0.01336669921875, 0.016798019409179688, 0.020229339599609375, 0.023660659790039062, 0.02709197998046875, 0.030523300170898438, 0.033954620361328125, 0.03738594055175781, 0.0408172607421875, 0.04424858093261719, 0.047679901123046875, 0.05111122131347656, 0.05454254150390625, 0.05797386169433594, 0.061405181884765625, 0.06483650207519531, 0.068267822265625, 0.07169914245605469, 0.07513046264648438, 0.07856178283691406, 0.08199310302734375, 0.08542442321777344, 0.08885574340820312, 0.09228706359863281, 0.0957183837890625, 0.09914970397949219, 0.10258102416992188, 0.10601234436035156, 0.10944366455078125, 0.11287498474121094, 0.11630630493164062, 0.11973762512207031, 0.1231689453125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 129.0, 702.0, 170.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012886013835668564, -0.012287216261029243, -0.011688417755067348, -0.011089619249105453, -0.010490821674466133, -0.009892024099826813, -0.009293225593864918, -0.008694427087903023, -0.008095629513263702, -0.007496831472963095, -0.006898033432662487, -0.006299235392361879, -0.005700437352061272, -0.005101639311760664, -0.004502841271460056, -0.0039040432311594486, -0.003305245190858841, -0.0027064471505582333, -0.0021076491102576256, -0.001508851069957018, -0.0009100530296564102, -0.00031125498935580254, 0.00028754305094480515, 0.0008863410912454128, 0.0014851391315460205, 0.002083937171846628, 0.002682735212147236, 0.0032815332524478436, 0.0038803312927484512, 0.004479129333049059, 0.005077927373349667, 0.005676725413650274, 0.006275523453950882, 0.00687432149425149, 0.007473119534552097, 0.008071918040513992, 0.008670715615153313, 0.009269513189792633, 0.009868311695754528, 0.010467110201716423, 0.011065907776355743, 0.011664705350995064, 0.012263503856956959, 0.012862302362918854, 0.013461099937558174, 0.014059897512197495, 0.01465869601815939, 0.015257494524121284, 0.015856292098760605, 0.016455089673399925, 0.017053887248039246, 0.017652686685323715, 0.018251484259963036, 0.018850281834602356, 0.019449081271886826, 0.020047878846526146, 0.020646676421165466, 0.021245473995804787, 0.021844271570444107, 0.022443071007728577, 0.023041868582367897, 0.023640666157007217, 0.024239465594291687, 0.024838263168931007, 0.025437060743570328]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 6.0, 8.0, 12.0, 16.0, 22.0, 15.0, 15.0, 19.0, 23.0, 29.0, 28.0, 24.0, 28.0, 34.0, 34.0, 36.0, 33.0, 32.0, 42.0, 36.0, 34.0, 39.0, 47.0, 30.0, 33.0, 32.0, 40.0, 38.0, 30.0, 27.0, 24.0, 18.0, 20.0, 22.0, 16.0, 4.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002066671848297119, -0.002003171481192112, -0.0019396711140871048, -0.0018761707469820976, -0.0018126703798770905, -0.0017491700127720833, -0.0016856696456670761, -0.001622169278562069, -0.0015586689114570618, -0.0014951685443520546, -0.0014316681772470474, -0.0013681678101420403, -0.001304667443037033, -0.001241167075932026, -0.0011776667088270187, -0.0011141663417220116, -0.0010506659746170044, -0.0009871656075119972, -0.00092366524040699, -0.0008601648733019829, -0.0007966645061969757, -0.0007331641390919685, -0.0006696637719869614, -0.0006061634048819542, -0.000542663037776947, -0.00047916267067193985, -0.0004156623035669327, -0.0003521619364619255, -0.00028866156935691833, -0.00022516120225191116, -0.000161660835146904, -9.816046804189682e-05, -3.466010093688965e-05, 2.8840266168117523e-05, 9.23406332731247e-05, 0.00015584100037813187, 0.00021934136748313904, 0.0002828417345881462, 0.0003463421016931534, 0.00040984246879816055, 0.0004733428359031677, 0.0005368432030081749, 0.0006003435701131821, 0.0006638439372181892, 0.0007273443043231964, 0.0007908446714282036, 0.0008543450385332108, 0.0009178454056382179, 0.000981345772743225, 0.0010448461398482323, 0.0011083465069532394, 0.0011718468740582466, 0.0012353472411632538, 0.001298847608268261, 0.0013623479753732681, 0.0014258483424782753, 0.0014893487095832825, 0.0015528490766882896, 0.0016163494437932968, 0.001679849810898304, 0.0017433501780033112, 0.0018068505451083183, 0.0018703509122133255, 0.0019338512793183327, 0.00199735164642334]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 7.0, 16.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 32.0, 36.0, 37.0, 40.0, 40.0, 41.0, 32.0, 38.0, 33.0, 43.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 10.0, 5.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.359375, -7.1290283203125, -6.898681640625, -6.6683349609375, -6.43798828125, -6.2076416015625, -5.977294921875, -5.7469482421875, -5.5166015625, -5.2862548828125, -5.055908203125, -4.8255615234375, -4.59521484375, -4.3648681640625, -4.134521484375, -3.9041748046875, -3.673828125, -3.4434814453125, -3.213134765625, -2.9827880859375, -2.75244140625, -2.5220947265625, -2.291748046875, -2.0614013671875, -1.8310546875, -1.6007080078125, -1.370361328125, -1.1400146484375, -0.90966796875, -0.6793212890625, -0.448974609375, -0.2186279296875, 0.01171875, 0.2420654296875, 0.472412109375, 0.7027587890625, 0.93310546875, 1.1634521484375, 1.393798828125, 1.6241455078125, 1.8544921875, 2.0848388671875, 2.315185546875, 2.5455322265625, 2.77587890625, 3.0062255859375, 3.236572265625, 3.4669189453125, 3.697265625, 3.9276123046875, 4.157958984375, 4.3883056640625, 4.61865234375, 4.8489990234375, 5.079345703125, 5.3096923828125, 5.5400390625, 5.7703857421875, 6.000732421875, 6.2310791015625, 6.46142578125, 6.6917724609375, 6.922119140625, 7.1524658203125, 7.3828125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 10.0, 7.0, 8.0, 14.0, 8.0, 13.0, 26.0, 31.0, 40.0, 39.0, 65.0, 58.0, 81.0, 110.0, 172.0, 216.0, 288.0, 411.0, 547.0, 1196.0, 2805.0, 9197.0, 36095.0, 505895.0, 441567.0, 34762.0, 8871.0, 2699.0, 1095.0, 584.0, 402.0, 293.0, 254.0, 156.0, 126.0, 101.0, 84.0, 58.0, 36.0, 34.0, 23.0, 18.0, 14.0, 14.0, 6.0, 10.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.515625, -17.936767578125, -17.35791015625, -16.779052734375, -16.2001953125, -15.621337890625, -15.04248046875, -14.463623046875, -13.884765625, -13.305908203125, -12.72705078125, -12.148193359375, -11.5693359375, -10.990478515625, -10.41162109375, -9.832763671875, -9.25390625, -8.675048828125, -8.09619140625, -7.517333984375, -6.9384765625, -6.359619140625, -5.78076171875, -5.201904296875, -4.623046875, -4.044189453125, -3.46533203125, -2.886474609375, -2.3076171875, -1.728759765625, -1.14990234375, -0.571044921875, 0.0078125, 0.586669921875, 1.16552734375, 1.744384765625, 2.3232421875, 2.902099609375, 3.48095703125, 4.059814453125, 4.638671875, 5.217529296875, 5.79638671875, 6.375244140625, 6.9541015625, 7.532958984375, 8.11181640625, 8.690673828125, 9.26953125, 9.848388671875, 10.42724609375, 11.006103515625, 11.5849609375, 12.163818359375, 12.74267578125, 13.321533203125, 13.900390625, 14.479248046875, 15.05810546875, 15.636962890625, 16.2158203125, 16.794677734375, 17.37353515625, 17.952392578125, 18.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 10.0, 13.0, 10.0, 21.0, 19.0, 16.0, 25.0, 29.0, 22.0, 33.0, 37.0, 38.0, 42.0, 47.0, 62.0, 99.0, 1701.0, 273.0, 78.0, 63.0, 41.0, 49.0, 38.0, 29.0, 29.0, 35.0, 23.0, 19.0, 23.0, 15.0, 18.0, 5.0, 8.0, 8.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.768798828125, -19.14697265625, -18.525146484375, -17.9033203125, -17.281494140625, -16.65966796875, -16.037841796875, -15.416015625, -14.794189453125, -14.17236328125, -13.550537109375, -12.9287109375, -12.306884765625, -11.68505859375, -11.063232421875, -10.44140625, -9.819580078125, -9.19775390625, -8.575927734375, -7.9541015625, -7.332275390625, -6.71044921875, -6.088623046875, -5.466796875, -4.844970703125, -4.22314453125, -3.601318359375, -2.9794921875, -2.357666015625, -1.73583984375, -1.114013671875, -0.4921875, 0.129638671875, 0.75146484375, 1.373291015625, 1.9951171875, 2.616943359375, 3.23876953125, 3.860595703125, 4.482421875, 5.104248046875, 5.72607421875, 6.347900390625, 6.9697265625, 7.591552734375, 8.21337890625, 8.835205078125, 9.45703125, 10.078857421875, 10.70068359375, 11.322509765625, 11.9443359375, 12.566162109375, 13.18798828125, 13.809814453125, 14.431640625, 15.053466796875, 15.67529296875, 16.297119140625, 16.9189453125, 17.540771484375, 18.16259765625, 18.784423828125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 11.0, 10.0, 6.0, 13.0, 19.0, 23.0, 28.0, 22.0, 25.0, 35.0, 51.0, 67.0, 78.0, 128.0, 225.0, 515.0, 3182.0, 113264.0, 3013563.0, 12496.0, 967.0, 317.0, 174.0, 82.0, 65.0, 52.0, 38.0, 33.0, 37.0, 26.0, 22.0, 20.0, 16.0, 19.0, 10.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.96875, -52.24072265625, -50.5126953125, -48.78466796875, -47.056640625, -45.32861328125, -43.6005859375, -41.87255859375, -40.14453125, -38.41650390625, -36.6884765625, -34.96044921875, -33.232421875, -31.50439453125, -29.7763671875, -28.04833984375, -26.3203125, -24.59228515625, -22.8642578125, -21.13623046875, -19.408203125, -17.68017578125, -15.9521484375, -14.22412109375, -12.49609375, -10.76806640625, -9.0400390625, -7.31201171875, -5.583984375, -3.85595703125, -2.1279296875, -0.39990234375, 1.328125, 3.05615234375, 4.7841796875, 6.51220703125, 8.240234375, 9.96826171875, 11.6962890625, 13.42431640625, 15.15234375, 16.88037109375, 18.6083984375, 20.33642578125, 22.064453125, 23.79248046875, 25.5205078125, 27.24853515625, 28.9765625, 30.70458984375, 32.4326171875, 34.16064453125, 35.888671875, 37.61669921875, 39.3447265625, 41.07275390625, 42.80078125, 44.52880859375, 46.2568359375, 47.98486328125, 49.712890625, 51.44091796875, 53.1689453125, 54.89697265625, 56.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 66.0, 207.0, 353.0, 258.0, 88.0, 19.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.25318908691406, -75.3061752319336, -73.35916900634766, -71.41215515136719, -69.46514892578125, -67.51813507080078, -65.57112884521484, -63.624114990234375, -61.67710876464844, -59.730098724365234, -57.78308868408203, -55.83607864379883, -53.889068603515625, -51.94205856323242, -49.99504852294922, -48.04803466796875, -46.10102462768555, -44.154014587402344, -42.20700454711914, -40.25999450683594, -38.312984466552734, -36.36597442626953, -34.41896057128906, -32.471954345703125, -30.52494239807129, -28.577932357788086, -26.630922317504883, -24.683910369873047, -22.736900329589844, -20.78989028930664, -18.842880249023438, -16.895870208740234, -14.948856353759766, -13.001846313476562, -11.05483627319336, -9.10782527923584, -7.160815238952637, -5.213805198669434, -3.266794204711914, -1.319784164428711, 0.6272258758544922, 2.5742361545562744, 4.521246433258057, 6.468256950378418, 8.415266990661621, 10.362277030944824, 12.309288024902344, 14.256298065185547, 16.20330810546875, 18.150318145751953, 20.097328186035156, 22.04433822631836, 23.991348266601562, 25.938358306884766, 27.8853702545166, 29.832380294799805, 31.779390335083008, 33.726402282714844, 35.67341232299805, 37.62042236328125, 39.56743240356445, 41.514442443847656, 43.46145248413086, 45.40846252441406, 47.355472564697266]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 1.0, 8.0, 7.0, 6.0, 20.0, 14.0, 17.0, 21.0, 26.0, 26.0, 31.0, 41.0, 35.0, 47.0, 37.0, 61.0, 42.0, 47.0, 51.0, 42.0, 32.0, 40.0, 44.0, 44.0, 34.0, 37.0, 37.0, 23.0, 17.0, 15.0, 19.0, 10.0, 19.0, 12.0, 4.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.02687072753906, -59.1953239440918, -57.3637809753418, -55.53223419189453, -53.700687408447266, -51.869140625, -50.03759765625, -48.206050872802734, -46.37450408935547, -44.5429573059082, -42.7114143371582, -40.87986755371094, -39.04832077026367, -37.216773986816406, -35.385231018066406, -33.55368423461914, -31.72214126586914, -29.890596389770508, -28.059049606323242, -26.22750473022461, -24.395957946777344, -22.56441307067871, -20.732868194580078, -18.901321411132812, -17.06977653503418, -15.23823070526123, -13.406684875488281, -11.575139999389648, -9.7435941696167, -7.91204833984375, -6.080503463745117, -4.248957633972168, -2.4174118041992188, -0.5858662128448486, 1.2456793785095215, 3.0772247314453125, 4.908770561218262, 6.740316390991211, 8.571861267089844, 10.403407096862793, 12.234952926635742, 14.066498756408691, 15.89804458618164, 17.729589462280273, 19.561134338378906, 21.392681121826172, 23.224225997924805, 25.055770874023438, 26.887317657470703, 28.718862533569336, 30.5504093170166, 32.381954193115234, 34.2135009765625, 36.0450439453125, 37.876590728759766, 39.70813751220703, 41.53968048095703, 43.3712272644043, 45.2027702331543, 47.03431701660156, 48.86586380004883, 50.697410583496094, 52.528953552246094, 54.36050033569336, 56.192047119140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 8.0, 11.0, 9.0, 12.0, 16.0, 18.0, 16.0, 23.0, 19.0, 22.0, 28.0, 26.0, 20.0, 29.0, 41.0, 34.0, 43.0, 46.0, 39.0, 42.0, 44.0, 34.0, 46.0, 41.0, 38.0, 35.0, 43.0, 34.0, 10.0, 26.0, 24.0, 23.0, 20.0, 17.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.828125, -7.58636474609375, -7.3446044921875, -7.10284423828125, -6.861083984375, -6.61932373046875, -6.3775634765625, -6.13580322265625, -5.89404296875, -5.65228271484375, -5.4105224609375, -5.16876220703125, -4.927001953125, -4.68524169921875, -4.4434814453125, -4.20172119140625, -3.9599609375, -3.71820068359375, -3.4764404296875, -3.23468017578125, -2.992919921875, -2.75115966796875, -2.5093994140625, -2.26763916015625, -2.02587890625, -1.78411865234375, -1.5423583984375, -1.30059814453125, -1.058837890625, -0.81707763671875, -0.5753173828125, -0.33355712890625, -0.091796875, 0.14996337890625, 0.3917236328125, 0.63348388671875, 0.875244140625, 1.11700439453125, 1.3587646484375, 1.60052490234375, 1.84228515625, 2.08404541015625, 2.3258056640625, 2.56756591796875, 2.809326171875, 3.05108642578125, 3.2928466796875, 3.53460693359375, 3.7763671875, 4.01812744140625, 4.2598876953125, 4.50164794921875, 4.743408203125, 4.98516845703125, 5.2269287109375, 5.46868896484375, 5.71044921875, 5.95220947265625, 6.1939697265625, 6.43572998046875, 6.677490234375, 6.91925048828125, 7.1610107421875, 7.40277099609375, 7.64453125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 17.0, 8.0, 16.0, 24.0, 29.0, 44.0, 58.0, 94.0, 104.0, 160.0, 283.0, 433.0, 759.0, 1369.0, 2700.0, 6098.0, 14870.0, 49043.0, 328152.0, 2165501.0, 1399109.0, 172450.0, 32382.0, 10983.0, 4507.0, 2242.0, 1089.0, 643.0, 375.0, 205.0, 145.0, 78.0, 74.0, 52.0, 35.0, 25.0, 22.0, 19.0, 20.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-15.796875, -15.31591796875, -14.8349609375, -14.35400390625, -13.873046875, -13.39208984375, -12.9111328125, -12.43017578125, -11.94921875, -11.46826171875, -10.9873046875, -10.50634765625, -10.025390625, -9.54443359375, -9.0634765625, -8.58251953125, -8.1015625, -7.62060546875, -7.1396484375, -6.65869140625, -6.177734375, -5.69677734375, -5.2158203125, -4.73486328125, -4.25390625, -3.77294921875, -3.2919921875, -2.81103515625, -2.330078125, -1.84912109375, -1.3681640625, -0.88720703125, -0.40625, 0.07470703125, 0.5556640625, 1.03662109375, 1.517578125, 1.99853515625, 2.4794921875, 2.96044921875, 3.44140625, 3.92236328125, 4.4033203125, 4.88427734375, 5.365234375, 5.84619140625, 6.3271484375, 6.80810546875, 7.2890625, 7.77001953125, 8.2509765625, 8.73193359375, 9.212890625, 9.69384765625, 10.1748046875, 10.65576171875, 11.13671875, 11.61767578125, 12.0986328125, 12.57958984375, 13.060546875, 13.54150390625, 14.0224609375, 14.50341796875, 14.984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 5.0, 13.0, 15.0, 29.0, 34.0, 38.0, 81.0, 100.0, 181.0, 244.0, 377.0, 565.0, 653.0, 601.0, 391.0, 229.0, 157.0, 116.0, 91.0, 50.0, 32.0, 21.0, 20.0, 10.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.671875, -15.139892578125, -14.60791015625, -14.075927734375, -13.5439453125, -13.011962890625, -12.47998046875, -11.947998046875, -11.416015625, -10.884033203125, -10.35205078125, -9.820068359375, -9.2880859375, -8.756103515625, -8.22412109375, -7.692138671875, -7.16015625, -6.628173828125, -6.09619140625, -5.564208984375, -5.0322265625, -4.500244140625, -3.96826171875, -3.436279296875, -2.904296875, -2.372314453125, -1.84033203125, -1.308349609375, -0.7763671875, -0.244384765625, 0.28759765625, 0.819580078125, 1.3515625, 1.883544921875, 2.41552734375, 2.947509765625, 3.4794921875, 4.011474609375, 4.54345703125, 5.075439453125, 5.607421875, 6.139404296875, 6.67138671875, 7.203369140625, 7.7353515625, 8.267333984375, 8.79931640625, 9.331298828125, 9.86328125, 10.395263671875, 10.92724609375, 11.459228515625, 11.9912109375, 12.523193359375, 13.05517578125, 13.587158203125, 14.119140625, 14.651123046875, 15.18310546875, 15.715087890625, 16.2470703125, 16.779052734375, 17.31103515625, 17.843017578125, 18.375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 8.0, 8.0, 14.0, 22.0, 35.0, 59.0, 54.0, 74.0, 135.0, 177.0, 264.0, 528.0, 1547.0, 8580.0, 121150.0, 3734941.0, 307272.0, 15544.0, 2288.0, 683.0, 327.0, 177.0, 130.0, 75.0, 53.0, 32.0, 30.0, 26.0, 15.0, 7.0, 10.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.48046875, -43.1171875, -41.75390625, -40.390625, -39.02734375, -37.6640625, -36.30078125, -34.9375, -33.57421875, -32.2109375, -30.84765625, -29.484375, -28.12109375, -26.7578125, -25.39453125, -24.03125, -22.66796875, -21.3046875, -19.94140625, -18.578125, -17.21484375, -15.8515625, -14.48828125, -13.125, -11.76171875, -10.3984375, -9.03515625, -7.671875, -6.30859375, -4.9453125, -3.58203125, -2.21875, -0.85546875, 0.5078125, 1.87109375, 3.234375, 4.59765625, 5.9609375, 7.32421875, 8.6875, 10.05078125, 11.4140625, 12.77734375, 14.140625, 15.50390625, 16.8671875, 18.23046875, 19.59375, 20.95703125, 22.3203125, 23.68359375, 25.046875, 26.41015625, 27.7734375, 29.13671875, 30.5, 31.86328125, 33.2265625, 34.58984375, 35.953125, 37.31640625, 38.6796875, 40.04296875, 41.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 15.0, 67.0, 247.0, 389.0, 209.0, 66.0, 14.0, 1.0, 0.0, 0.0, 1.0], "bins": [-306.80279541015625, -301.35601806640625, -295.90924072265625, -290.46246337890625, -285.01568603515625, -279.56890869140625, -274.12213134765625, -268.67535400390625, -263.22857666015625, -257.78179931640625, -252.33502197265625, -246.88824462890625, -241.44146728515625, -235.9946746826172, -230.5478973388672, -225.1011199951172, -219.65432739257812, -214.20755004882812, -208.76077270507812, -203.31399536132812, -197.86721801757812, -192.42042541503906, -186.97364807128906, -181.52687072753906, -176.08009338378906, -170.63331604003906, -165.18653869628906, -159.73976135253906, -154.29296875, -148.84619140625, -143.3994140625, -137.95263671875, -132.505859375, -127.05908203125, -121.6123046875, -116.16551971435547, -110.71874237060547, -105.27196502685547, -99.82518005371094, -94.37840270996094, -88.9316177368164, -83.4848403930664, -78.03805541992188, -72.59127807617188, -67.14450073242188, -61.697723388671875, -56.25094223022461, -50.804161071777344, -45.357383728027344, -39.910606384277344, -34.46382522583008, -29.017045974731445, -23.570266723632812, -18.12348747253418, -12.676708221435547, -7.229927062988281, -1.7831497192382812, 3.6636295318603516, 9.110408782958984, 14.557188034057617, 20.00396728515625, 25.450746536254883, 30.897525787353516, 36.34430694580078, 41.79108428955078]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 8.0, 2.0, 12.0, 7.0, 13.0, 16.0, 20.0, 17.0, 23.0, 18.0, 20.0, 25.0, 27.0, 36.0, 48.0, 35.0, 30.0, 39.0, 34.0, 44.0, 39.0, 42.0, 27.0, 40.0, 30.0, 31.0, 34.0, 27.0, 33.0, 30.0, 25.0, 31.0, 18.0, 16.0, 11.0, 12.0, 17.0, 5.0, 17.0, 5.0, 13.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.7432861328125, -37.51582336425781, -36.288360595703125, -35.06089782714844, -33.83343505859375, -32.60597229003906, -31.378511428833008, -30.15104866027832, -28.923585891723633, -27.696123123168945, -26.468660354614258, -25.24119758605957, -24.013736724853516, -22.786273956298828, -21.55881118774414, -20.331348419189453, -19.103885650634766, -17.876422882080078, -16.64896011352539, -15.42149829864502, -14.194035530090332, -12.966572761535645, -11.739110946655273, -10.511648178100586, -9.284185409545898, -8.056722640991211, -6.829260349273682, -5.601798057556152, -4.374335289001465, -3.1468725204467773, -1.919410228729248, -0.6919479370117188, 0.5355148315429688, 1.7629773616790771, 2.9904398918151855, 4.217902183532715, 5.445364952087402, 6.67282772064209, 7.900290012359619, 9.127752304077148, 10.355215072631836, 11.582677841186523, 12.810140609741211, 14.037602424621582, 15.26506519317627, 16.49252700805664, 17.719989776611328, 18.947452545166016, 20.174915313720703, 21.40237808227539, 22.629840850830078, 23.857303619384766, 25.084766387939453, 26.31222915649414, 27.539690017700195, 28.767152786254883, 29.99461555480957, 31.222078323364258, 32.44953918457031, 33.677001953125, 34.90446472167969, 36.131927490234375, 37.35939025878906, 38.58685302734375, 39.81431579589844]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 42.0, 44.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 12.0, 9.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 15.0, 26.0, 45.0, 58.0, 78.0, 123.0, 201.0, 297.0, 462.0, 714.0, 1127.0, 1764.0, 2649.0, 4109.0, 6392.0, 9966.0, 15626.0, 24178.0, 37751.0, 58858.0, 89771.0, 130651.0, 166749.0, 158209.0, 117265.0, 78659.0, 51227.0, 32562.0, 21060.0, 13167.0, 8845.0, 5528.0, 3688.0, 2421.0, 1538.0, 967.0, 653.0, 394.0, 248.0, 188.0, 114.0, 79.0, 45.0, 26.0, 24.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.7431640625, -0.7205352783203125, -0.697906494140625, -0.6752777099609375, -0.65264892578125, -0.6300201416015625, -0.607391357421875, -0.5847625732421875, -0.5621337890625, -0.5395050048828125, -0.516876220703125, -0.4942474365234375, -0.47161865234375, -0.4489898681640625, -0.426361083984375, -0.4037322998046875, -0.381103515625, -0.3584747314453125, -0.335845947265625, -0.3132171630859375, -0.29058837890625, -0.2679595947265625, -0.245330810546875, -0.2227020263671875, -0.2000732421875, -0.1774444580078125, -0.154815673828125, -0.1321868896484375, -0.10955810546875, -0.0869293212890625, -0.064300537109375, -0.0416717529296875, -0.01904296875, 0.0035858154296875, 0.026214599609375, 0.0488433837890625, 0.07147216796875, 0.0941009521484375, 0.116729736328125, 0.1393585205078125, 0.1619873046875, 0.1846160888671875, 0.207244873046875, 0.2298736572265625, 0.25250244140625, 0.2751312255859375, 0.297760009765625, 0.3203887939453125, 0.343017578125, 0.3656463623046875, 0.388275146484375, 0.4109039306640625, 0.43353271484375, 0.4561614990234375, 0.478790283203125, 0.5014190673828125, 0.5240478515625, 0.5466766357421875, 0.569305419921875, 0.5919342041015625, 0.61456298828125, 0.6371917724609375, 0.659820556640625, 0.6824493408203125, 0.705078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 13.0, 21.0, 22.0, 23.0, 25.0, 30.0, 26.0, 34.0, 38.0, 39.0, 46.0, 47.0, 43.0, 45.0, 1052.0, 31.0, 41.0, 31.0, 33.0, 35.0, 47.0, 36.0, 26.0, 33.0, 22.0, 19.0, 20.0, 22.0, 16.0, 5.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.08984375, -4.92645263671875, -4.7630615234375, -4.59967041015625, -4.436279296875, -4.27288818359375, -4.1094970703125, -3.94610595703125, -3.78271484375, -3.61932373046875, -3.4559326171875, -3.29254150390625, -3.129150390625, -2.96575927734375, -2.8023681640625, -2.63897705078125, -2.4755859375, -2.31219482421875, -2.1488037109375, -1.98541259765625, -1.822021484375, -1.65863037109375, -1.4952392578125, -1.33184814453125, -1.16845703125, -1.00506591796875, -0.8416748046875, -0.67828369140625, -0.514892578125, -0.35150146484375, -0.1881103515625, -0.02471923828125, 0.138671875, 0.30206298828125, 0.4654541015625, 0.62884521484375, 0.792236328125, 0.95562744140625, 1.1190185546875, 1.28240966796875, 1.44580078125, 1.60919189453125, 1.7725830078125, 1.93597412109375, 2.099365234375, 2.26275634765625, 2.4261474609375, 2.58953857421875, 2.7529296875, 2.91632080078125, 3.0797119140625, 3.24310302734375, 3.406494140625, 3.56988525390625, 3.7332763671875, 3.89666748046875, 4.06005859375, 4.22344970703125, 4.3868408203125, 4.55023193359375, 4.713623046875, 4.87701416015625, 5.0404052734375, 5.20379638671875, 5.3671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 13.0, 18.0, 35.0, 50.0, 75.0, 116.0, 186.0, 310.0, 522.0, 791.0, 1247.0, 1966.0, 3072.0, 4876.0, 7759.0, 12293.0, 19653.0, 30545.0, 48623.0, 74060.0, 109091.0, 145952.0, 1209332.0, 138691.0, 101158.0, 67319.0, 43447.0, 27722.0, 17804.0, 11105.0, 7083.0, 4377.0, 2895.0, 1831.0, 1149.0, 702.0, 469.0, 290.0, 171.0, 123.0, 78.0, 48.0, 27.0, 15.0, 9.0, 9.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.63330078125, -0.6137466430664062, -0.5941925048828125, -0.5746383666992188, -0.555084228515625, -0.5355300903320312, -0.5159759521484375, -0.49642181396484375, -0.47686767578125, -0.45731353759765625, -0.4377593994140625, -0.41820526123046875, -0.398651123046875, -0.37909698486328125, -0.3595428466796875, -0.33998870849609375, -0.3204345703125, -0.30088043212890625, -0.2813262939453125, -0.26177215576171875, -0.242218017578125, -0.22266387939453125, -0.2031097412109375, -0.18355560302734375, -0.16400146484375, -0.14444732666015625, -0.1248931884765625, -0.10533905029296875, -0.085784912109375, -0.06623077392578125, -0.0466766357421875, -0.02712249755859375, -0.007568359375, 0.01198577880859375, 0.0315399169921875, 0.05109405517578125, 0.070648193359375, 0.09020233154296875, 0.1097564697265625, 0.12931060791015625, 0.14886474609375, 0.16841888427734375, 0.1879730224609375, 0.20752716064453125, 0.227081298828125, 0.24663543701171875, 0.2661895751953125, 0.28574371337890625, 0.3052978515625, 0.32485198974609375, 0.3444061279296875, 0.36396026611328125, 0.383514404296875, 0.40306854248046875, 0.4226226806640625, 0.44217681884765625, 0.46173095703125, 0.48128509521484375, 0.5008392333984375, 0.5203933715820312, 0.539947509765625, 0.5595016479492188, 0.5790557861328125, 0.5986099243164062, 0.6181640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 23.0, 32.0, 44.0, 54.0, 60.0, 73.0, 85.0, 91.0, 81.0, 84.0, 58.0, 68.0, 58.0, 36.0, 32.0, 17.0, 17.0, 15.0, 7.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00699615478515625, -0.006795704364776611, -0.006595253944396973, -0.006394803524017334, -0.006194353103637695, -0.005993902683258057, -0.005793452262878418, -0.005593001842498779, -0.005392551422119141, -0.005192101001739502, -0.004991650581359863, -0.004791200160980225, -0.004590749740600586, -0.004390299320220947, -0.004189848899841309, -0.00398939847946167, -0.0037889480590820312, -0.0035884976387023926, -0.003388047218322754, -0.0031875967979431152, -0.0029871463775634766, -0.002786695957183838, -0.0025862455368041992, -0.0023857951164245605, -0.002185344696044922, -0.001984894275665283, -0.0017844438552856445, -0.0015839934349060059, -0.0013835430145263672, -0.0011830925941467285, -0.0009826421737670898, -0.0007821917533874512, -0.0005817413330078125, -0.00038129091262817383, -0.00018084049224853516, 1.9609928131103516e-05, 0.0002200603485107422, 0.00042051076889038086, 0.0006209611892700195, 0.0008214116096496582, 0.0010218620300292969, 0.0012223124504089355, 0.0014227628707885742, 0.0016232132911682129, 0.0018236637115478516, 0.0020241141319274902, 0.002224564552307129, 0.0024250149726867676, 0.0026254653930664062, 0.002825915813446045, 0.0030263662338256836, 0.0032268166542053223, 0.003427267074584961, 0.0036277174949645996, 0.0038281679153442383, 0.004028618335723877, 0.004229068756103516, 0.004429519176483154, 0.004629969596862793, 0.004830420017242432, 0.00503087043762207, 0.005231320858001709, 0.005431771278381348, 0.005632221698760986, 0.005832672119140625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 14.0, 13.0, 7.0, 25.0, 29.0, 34.0, 66.0, 82.0, 149.0, 165.0, 329.0, 803.0, 60574.0, 983653.0, 1463.0, 432.0, 224.0, 149.0, 100.0, 72.0, 36.0, 31.0, 21.0, 14.0, 10.0, 16.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10939979553222656, -0.10551834106445312, -0.10163688659667969, -0.09775543212890625, -0.09387397766113281, -0.08999252319335938, -0.08611106872558594, -0.0822296142578125, -0.07834815979003906, -0.07446670532226562, -0.07058525085449219, -0.06670379638671875, -0.06282234191894531, -0.058940887451171875, -0.05505943298339844, -0.051177978515625, -0.04729652404785156, -0.043415069580078125, -0.03953361511230469, -0.03565216064453125, -0.03177070617675781, -0.027889251708984375, -0.024007797241210938, -0.0201263427734375, -0.016244888305664062, -0.012363433837890625, -0.008481979370117188, -0.00460052490234375, -0.0007190704345703125, 0.003162384033203125, 0.0070438385009765625, 0.01092529296875, 0.014806747436523438, 0.018688201904296875, 0.022569656372070312, 0.02645111083984375, 0.030332565307617188, 0.034214019775390625, 0.03809547424316406, 0.0419769287109375, 0.04585838317871094, 0.049739837646484375, 0.05362129211425781, 0.05750274658203125, 0.06138420104980469, 0.06526565551757812, 0.06914710998535156, 0.073028564453125, 0.07691001892089844, 0.08079147338867188, 0.08467292785644531, 0.08855438232421875, 0.09243583679199219, 0.09631729125976562, 0.10019874572753906, 0.1040802001953125, 0.10796165466308594, 0.11184310913085938, 0.11572456359863281, 0.11960601806640625, 0.12348747253417969, 0.12736892700195312, 0.13125038146972656, 0.1351318359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 268.0, 748.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06338192522525787, -0.061718348413705826, -0.06005476787686348, -0.05839119106531143, -0.056727610528469086, -0.05506403371691704, -0.05340045690536499, -0.051736876368522644, -0.0500732958316803, -0.04840971902012825, -0.046746138483285904, -0.045082561671733856, -0.04341898113489151, -0.04175540432333946, -0.040091827511787415, -0.03842824697494507, -0.03676467016339302, -0.03510109335184097, -0.03343751281499863, -0.03177393600344658, -0.030110355466604233, -0.028446778655052185, -0.026783199980854988, -0.02511962130665779, -0.023456042632460594, -0.021792463958263397, -0.0201288852840662, -0.018465306609869003, -0.016801729798316956, -0.015138150192797184, -0.013474572449922562, -0.011810993775725365, -0.010147418826818466, -0.00848384015262127, -0.00682026194408536, -0.00515668373554945, -0.003493105061352253, -0.001829526387155056, -0.00016594864428043365, 0.0014976300299167633, 0.0031612087041139603, 0.004824787378311157, 0.006488365586847067, 0.008151943795382977, 0.009815522469580173, 0.01147910114377737, 0.013142678886651993, 0.01480625756084919, 0.016469836235046387, 0.018133414909243584, 0.01979699358344078, 0.02146057039499283, 0.023124150931835175, 0.024787727743387222, 0.02645130641758442, 0.028114885091781616, 0.029778463765978813, 0.03144204244017601, 0.03310561925172806, 0.034769199788570404, 0.03643277660012245, 0.0380963571369648, 0.039759933948516846, 0.04142351448535919, 0.04308709129691124]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 10.0, 13.0, 14.0, 13.0, 23.0, 27.0, 28.0, 33.0, 23.0, 26.0, 39.0, 35.0, 37.0, 45.0, 52.0, 52.0, 41.0, 54.0, 51.0, 47.0, 44.0, 49.0, 37.0, 30.0, 33.0, 34.0, 17.0, 19.0, 15.0, 19.0, 13.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024068355560302734, -0.002306555397808552, -0.00220627523958683, -0.0021059950813651085, -0.002005714923143387, -0.0019054347649216652, -0.0018051546066999435, -0.001704874448478222, -0.0016045942902565002, -0.0015043141320347786, -0.001404033973813057, -0.0013037538155913353, -0.0012034736573696136, -0.001103193499147892, -0.0010029133409261703, -0.0009026331827044487, -0.000802353024482727, -0.0007020728662610054, -0.0006017927080392838, -0.0005015125498175621, -0.00040123239159584045, -0.0003009522333741188, -0.00020067207515239716, -0.0001003919169306755, -1.1175870895385742e-07, 0.00010016839951276779, 0.00020044855773448944, 0.0003007287159562111, 0.00040100887417793274, 0.0005012890323996544, 0.000601569190621376, 0.0007018493488430977, 0.0008021295070648193, 0.000902409665286541, 0.0010026898235082626, 0.0011029699817299843, 0.001203250139951706, 0.0013035302981734276, 0.0014038104563951492, 0.0015040906146168709, 0.0016043707728385925, 0.0017046509310603142, 0.0018049310892820358, 0.0019052112475037575, 0.002005491405725479, 0.0021057715639472008, 0.0022060517221689224, 0.002306331880390644, 0.0024066120386123657, 0.0025068921968340874, 0.002607172355055809, 0.0027074525132775307, 0.0028077326714992523, 0.002908012829720974, 0.0030082929879426956, 0.0031085731461644173, 0.003208853304386139, 0.0033091334626078606, 0.003409413620829582, 0.003509693779051304, 0.0036099739372730255, 0.003710254095494747, 0.003810534253716469, 0.0039108144119381905, 0.004011094570159912]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 41.0, 45.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 13.0, 8.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 11.0, 9.0, 13.0, 18.0, 32.0, 29.0, 44.0, 61.0, 66.0, 124.0, 158.0, 272.0, 449.0, 831.0, 1526.0, 3095.0, 6202.0, 13311.0, 29188.0, 69345.0, 198131.0, 457629.0, 160008.0, 59471.0, 25691.0, 11428.0, 5389.0, 2681.0, 1367.0, 733.0, 370.0, 272.0, 172.0, 114.0, 73.0, 50.0, 44.0, 22.0, 31.0, 24.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-11.0859375, -10.7637939453125, -10.441650390625, -10.1195068359375, -9.79736328125, -9.4752197265625, -9.153076171875, -8.8309326171875, -8.5087890625, -8.1866455078125, -7.864501953125, -7.5423583984375, -7.22021484375, -6.8980712890625, -6.575927734375, -6.2537841796875, -5.931640625, -5.6094970703125, -5.287353515625, -4.9652099609375, -4.64306640625, -4.3209228515625, -3.998779296875, -3.6766357421875, -3.3544921875, -3.0323486328125, -2.710205078125, -2.3880615234375, -2.06591796875, -1.7437744140625, -1.421630859375, -1.0994873046875, -0.77734375, -0.4552001953125, -0.133056640625, 0.1890869140625, 0.51123046875, 0.8333740234375, 1.155517578125, 1.4776611328125, 1.7998046875, 2.1219482421875, 2.444091796875, 2.7662353515625, 3.08837890625, 3.4105224609375, 3.732666015625, 4.0548095703125, 4.376953125, 4.6990966796875, 5.021240234375, 5.3433837890625, 5.66552734375, 5.9876708984375, 6.309814453125, 6.6319580078125, 6.9541015625, 7.2762451171875, 7.598388671875, 7.9205322265625, 8.24267578125, 8.5648193359375, 8.886962890625, 9.2091064453125, 9.53125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 10.0, 10.0, 9.0, 16.0, 17.0, 21.0, 27.0, 20.0, 31.0, 22.0, 37.0, 42.0, 43.0, 71.0, 82.0, 138.0, 1518.0, 336.0, 141.0, 70.0, 55.0, 40.0, 28.0, 33.0, 40.0, 21.0, 28.0, 23.0, 20.0, 6.0, 14.0, 11.0, 12.0, 9.0, 10.0, 5.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.6494140625, -21.892578125, -21.1357421875, -20.37890625, -19.6220703125, -18.865234375, -18.1083984375, -17.3515625, -16.5947265625, -15.837890625, -15.0810546875, -14.32421875, -13.5673828125, -12.810546875, -12.0537109375, -11.296875, -10.5400390625, -9.783203125, -9.0263671875, -8.26953125, -7.5126953125, -6.755859375, -5.9990234375, -5.2421875, -4.4853515625, -3.728515625, -2.9716796875, -2.21484375, -1.4580078125, -0.701171875, 0.0556640625, 0.8125, 1.5693359375, 2.326171875, 3.0830078125, 3.83984375, 4.5966796875, 5.353515625, 6.1103515625, 6.8671875, 7.6240234375, 8.380859375, 9.1376953125, 9.89453125, 10.6513671875, 11.408203125, 12.1650390625, 12.921875, 13.6787109375, 14.435546875, 15.1923828125, 15.94921875, 16.7060546875, 17.462890625, 18.2197265625, 18.9765625, 19.7333984375, 20.490234375, 21.2470703125, 22.00390625, 22.7607421875, 23.517578125, 24.2744140625, 25.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 13.0, 19.0, 21.0, 28.0, 44.0, 50.0, 81.0, 102.0, 168.0, 248.0, 467.0, 1680.0, 19162.0, 1968957.0, 1135516.0, 16335.0, 1493.0, 491.0, 229.0, 161.0, 110.0, 79.0, 58.0, 38.0, 34.0, 25.0, 16.0, 15.0, 12.0, 2.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -36.990234375, -35.66796875, -34.345703125, -33.0234375, -31.701171875, -30.37890625, -29.056640625, -27.734375, -26.412109375, -25.08984375, -23.767578125, -22.4453125, -21.123046875, -19.80078125, -18.478515625, -17.15625, -15.833984375, -14.51171875, -13.189453125, -11.8671875, -10.544921875, -9.22265625, -7.900390625, -6.578125, -5.255859375, -3.93359375, -2.611328125, -1.2890625, 0.033203125, 1.35546875, 2.677734375, 4.0, 5.322265625, 6.64453125, 7.966796875, 9.2890625, 10.611328125, 11.93359375, 13.255859375, 14.578125, 15.900390625, 17.22265625, 18.544921875, 19.8671875, 21.189453125, 22.51171875, 23.833984375, 25.15625, 26.478515625, 27.80078125, 29.123046875, 30.4453125, 31.767578125, 33.08984375, 34.412109375, 35.734375, 37.056640625, 38.37890625, 39.701171875, 41.0234375, 42.345703125, 43.66796875, 44.990234375, 46.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 260.0, 748.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.1582641601562, -556.3590087890625, -544.5596923828125, -532.7604370117188, -520.961181640625, -509.1618957519531, -497.36260986328125, -485.5633544921875, -473.76409912109375, -461.9648132324219, -450.1655578613281, -438.36627197265625, -426.5670166015625, -414.7677307128906, -402.96844482421875, -391.169189453125, -379.3699035644531, -367.57061767578125, -355.7713623046875, -343.9720764160156, -332.1728210449219, -320.37353515625, -308.57427978515625, -296.7749938964844, -284.9757080078125, -273.1764221191406, -261.3771667480469, -249.577880859375, -237.77862548828125, -225.97933959960938, -214.18006896972656, -202.38079833984375, -190.58151245117188, -178.78224182128906, -166.98297119140625, -155.18368530273438, -143.38442993164062, -131.58514404296875, -119.78587341308594, -107.98660278320312, -96.18733215332031, -84.3880615234375, -72.58879089355469, -60.789512634277344, -48.99024200439453, -37.19097137451172, -25.391693115234375, -13.592422485351562, -1.79315185546875, 10.006120681762695, 21.80539321899414, 33.60466766357422, 45.40393829345703, 57.203208923339844, 69.00248718261719, 80.8017578125, 92.60102844238281, 104.40029907226562, 116.19956970214844, 127.99884796142578, 139.79812622070312, 151.59738159179688, 163.39666748046875, 175.19593811035156, 186.99520874023438]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 0.0, 9.0, 8.0, 7.0, 17.0, 18.0, 16.0, 12.0, 15.0, 24.0, 21.0, 30.0, 23.0, 27.0, 26.0, 35.0, 28.0, 44.0, 33.0, 38.0, 30.0, 36.0, 30.0, 31.0, 38.0, 37.0, 48.0, 29.0, 23.0, 37.0, 31.0, 22.0, 25.0, 28.0, 14.0, 19.0, 10.0, 15.0, 7.0, 6.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.95530700683594, -40.405799865722656, -38.856292724609375, -37.306785583496094, -35.75727844238281, -34.20777130126953, -32.65826416015625, -31.10875701904297, -29.559249877929688, -28.009742736816406, -26.460235595703125, -24.910728454589844, -23.361221313476562, -21.81171417236328, -20.26220703125, -18.71269989013672, -17.163192749023438, -15.613685607910156, -14.064178466796875, -12.514671325683594, -10.965164184570312, -9.415657043457031, -7.86614990234375, -6.316642761230469, -4.7671356201171875, -3.2176284790039062, -1.668121337890625, -0.11861419677734375, 1.4308929443359375, 2.9804000854492188, 4.5299072265625, 6.079414367675781, 7.6289215087890625, 9.178428649902344, 10.727935791015625, 12.277442932128906, 13.826950073242188, 15.376457214355469, 16.92596435546875, 18.47547149658203, 20.024978637695312, 21.574485778808594, 23.123992919921875, 24.673500061035156, 26.223007202148438, 27.77251434326172, 29.322021484375, 30.87152862548828, 32.42103576660156, 33.970542907714844, 35.520050048828125, 37.069557189941406, 38.61906433105469, 40.16857147216797, 41.71807861328125, 43.26758575439453, 44.81709289550781, 46.366600036621094, 47.916107177734375, 49.465614318847656, 51.01512145996094, 52.56462860107422, 54.1141357421875, 55.66364288330078, 57.21315002441406]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 18.0, 15.0, 10.0, 12.0, 21.0, 24.0, 21.0, 46.0, 34.0, 40.0, 46.0, 40.0, 26.0, 48.0, 28.0, 31.0, 47.0, 47.0, 52.0, 37.0, 36.0, 33.0, 27.0, 31.0, 33.0, 21.0, 30.0, 25.0, 16.0, 11.0, 7.0, 6.0, 6.0, 14.0, 4.0, 4.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.375732421875, -8.10302734375, -7.830322265625, -7.5576171875, -7.284912109375, -7.01220703125, -6.739501953125, -6.466796875, -6.194091796875, -5.92138671875, -5.648681640625, -5.3759765625, -5.103271484375, -4.83056640625, -4.557861328125, -4.28515625, -4.012451171875, -3.73974609375, -3.467041015625, -3.1943359375, -2.921630859375, -2.64892578125, -2.376220703125, -2.103515625, -1.830810546875, -1.55810546875, -1.285400390625, -1.0126953125, -0.739990234375, -0.46728515625, -0.194580078125, 0.078125, 0.350830078125, 0.62353515625, 0.896240234375, 1.1689453125, 1.441650390625, 1.71435546875, 1.987060546875, 2.259765625, 2.532470703125, 2.80517578125, 3.077880859375, 3.3505859375, 3.623291015625, 3.89599609375, 4.168701171875, 4.44140625, 4.714111328125, 4.98681640625, 5.259521484375, 5.5322265625, 5.804931640625, 6.07763671875, 6.350341796875, 6.623046875, 6.895751953125, 7.16845703125, 7.441162109375, 7.7138671875, 7.986572265625, 8.25927734375, 8.531982421875, 8.8046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 9.0, 13.0, 14.0, 18.0, 26.0, 47.0, 73.0, 119.0, 211.0, 379.0, 831.0, 1678.0, 4016.0, 10589.0, 36519.0, 281811.0, 2475834.0, 1247579.0, 101924.0, 20492.0, 6864.0, 2772.0, 1161.0, 576.0, 285.0, 162.0, 69.0, 56.0, 28.0, 28.0, 21.0, 9.0, 5.0, 10.0, 8.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.607177734375, -16.99560546875, -16.384033203125, -15.7724609375, -15.160888671875, -14.54931640625, -13.937744140625, -13.326171875, -12.714599609375, -12.10302734375, -11.491455078125, -10.8798828125, -10.268310546875, -9.65673828125, -9.045166015625, -8.43359375, -7.822021484375, -7.21044921875, -6.598876953125, -5.9873046875, -5.375732421875, -4.76416015625, -4.152587890625, -3.541015625, -2.929443359375, -2.31787109375, -1.706298828125, -1.0947265625, -0.483154296875, 0.12841796875, 0.739990234375, 1.3515625, 1.963134765625, 2.57470703125, 3.186279296875, 3.7978515625, 4.409423828125, 5.02099609375, 5.632568359375, 6.244140625, 6.855712890625, 7.46728515625, 8.078857421875, 8.6904296875, 9.302001953125, 9.91357421875, 10.525146484375, 11.13671875, 11.748291015625, 12.35986328125, 12.971435546875, 13.5830078125, 14.194580078125, 14.80615234375, 15.417724609375, 16.029296875, 16.640869140625, 17.25244140625, 17.864013671875, 18.4755859375, 19.087158203125, 19.69873046875, 20.310302734375, 20.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 13.0, 10.0, 8.0, 19.0, 24.0, 22.0, 21.0, 26.0, 57.0, 59.0, 72.0, 97.0, 139.0, 182.0, 291.0, 385.0, 476.0, 528.0, 484.0, 353.0, 220.0, 149.0, 98.0, 87.0, 59.0, 49.0, 27.0, 32.0, 19.0, 8.0, 13.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.36865234375, -10.9794921875, -10.59033203125, -10.201171875, -9.81201171875, -9.4228515625, -9.03369140625, -8.64453125, -8.25537109375, -7.8662109375, -7.47705078125, -7.087890625, -6.69873046875, -6.3095703125, -5.92041015625, -5.53125, -5.14208984375, -4.7529296875, -4.36376953125, -3.974609375, -3.58544921875, -3.1962890625, -2.80712890625, -2.41796875, -2.02880859375, -1.6396484375, -1.25048828125, -0.861328125, -0.47216796875, -0.0830078125, 0.30615234375, 0.6953125, 1.08447265625, 1.4736328125, 1.86279296875, 2.251953125, 2.64111328125, 3.0302734375, 3.41943359375, 3.80859375, 4.19775390625, 4.5869140625, 4.97607421875, 5.365234375, 5.75439453125, 6.1435546875, 6.53271484375, 6.921875, 7.31103515625, 7.7001953125, 8.08935546875, 8.478515625, 8.86767578125, 9.2568359375, 9.64599609375, 10.03515625, 10.42431640625, 10.8134765625, 11.20263671875, 11.591796875, 11.98095703125, 12.3701171875, 12.75927734375, 13.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 10.0, 6.0, 12.0, 20.0, 30.0, 28.0, 57.0, 63.0, 113.0, 174.0, 333.0, 624.0, 1487.0, 3482.0, 10410.0, 36931.0, 179319.0, 2119541.0, 1646334.0, 149476.0, 31126.0, 8838.0, 3092.0, 1328.0, 572.0, 304.0, 166.0, 105.0, 87.0, 50.0, 36.0, 20.0, 25.0, 17.0, 8.0, 9.0, 12.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.84375, -19.20263671875, -18.5615234375, -17.92041015625, -17.279296875, -16.63818359375, -15.9970703125, -15.35595703125, -14.71484375, -14.07373046875, -13.4326171875, -12.79150390625, -12.150390625, -11.50927734375, -10.8681640625, -10.22705078125, -9.5859375, -8.94482421875, -8.3037109375, -7.66259765625, -7.021484375, -6.38037109375, -5.7392578125, -5.09814453125, -4.45703125, -3.81591796875, -3.1748046875, -2.53369140625, -1.892578125, -1.25146484375, -0.6103515625, 0.03076171875, 0.671875, 1.31298828125, 1.9541015625, 2.59521484375, 3.236328125, 3.87744140625, 4.5185546875, 5.15966796875, 5.80078125, 6.44189453125, 7.0830078125, 7.72412109375, 8.365234375, 9.00634765625, 9.6474609375, 10.28857421875, 10.9296875, 11.57080078125, 12.2119140625, 12.85302734375, 13.494140625, 14.13525390625, 14.7763671875, 15.41748046875, 16.05859375, 16.69970703125, 17.3408203125, 17.98193359375, 18.623046875, 19.26416015625, 19.9052734375, 20.54638671875, 21.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 19.0, 44.0, 139.0, 290.0, 281.0, 151.0, 56.0, 19.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.59783935546875, -122.66924285888672, -118.74064636230469, -114.81204986572266, -110.88345336914062, -106.9548568725586, -103.02626037597656, -99.09766387939453, -95.1690673828125, -91.24047088623047, -87.31187438964844, -83.3832778930664, -79.45468139648438, -75.52608489990234, -71.59748840332031, -67.66889190673828, -63.74029541015625, -59.81169891357422, -55.88310241699219, -51.954505920410156, -48.025909423828125, -44.097312927246094, -40.16871643066406, -36.24011993408203, -32.3115234375, -28.38292694091797, -24.454330444335938, -20.525733947753906, -16.597137451171875, -12.668540954589844, -8.739944458007812, -4.811347961425781, -0.8827438354492188, 3.0458526611328125, 6.974449157714844, 10.903045654296875, 14.831642150878906, 18.760238647460938, 22.68883514404297, 26.617431640625, 30.54602813720703, 34.47462463378906, 38.403221130371094, 42.331817626953125, 46.260414123535156, 50.18901062011719, 54.11760711669922, 58.04620361328125, 61.97480010986328, 65.90339660644531, 69.83199310302734, 73.76058959960938, 77.6891860961914, 81.61778259277344, 85.54637908935547, 89.4749755859375, 93.40357208251953, 97.33216857910156, 101.2607650756836, 105.18936157226562, 109.11795806884766, 113.04655456542969, 116.97515106201172, 120.90374755859375, 124.83234405517578]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 19.0, 15.0, 12.0, 18.0, 27.0, 24.0, 28.0, 19.0, 28.0, 29.0, 31.0, 40.0, 38.0, 35.0, 44.0, 65.0, 36.0, 57.0, 39.0, 44.0, 39.0, 36.0, 31.0, 28.0, 37.0, 24.0, 18.0, 17.0, 18.0, 24.0, 10.0, 15.0, 3.0, 3.0, 10.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.79145812988281, -45.34745788574219, -43.9034538269043, -42.45945358276367, -41.01544952392578, -39.571449279785156, -38.12744903564453, -36.683448791503906, -35.239444732666016, -33.79544448852539, -32.3514404296875, -30.907440185546875, -29.463438034057617, -28.01943588256836, -26.575435638427734, -25.131433486938477, -23.68743133544922, -22.24342918395996, -20.799427032470703, -19.355426788330078, -17.91142463684082, -16.467422485351562, -15.023421287536621, -13.57942008972168, -12.135417938232422, -10.691415786743164, -9.247414588928223, -7.803412914276123, -6.359411239624023, -4.915409564971924, -3.471407890319824, -2.027406692504883, -0.583404541015625, 0.8605971336364746, 2.304598808288574, 3.748600482940674, 5.192602157592773, 6.636603832244873, 8.080605506896973, 9.524606704711914, 10.968608856201172, 12.41261100769043, 13.856612205505371, 15.300613403320312, 16.74461555480957, 18.188617706298828, 19.632617950439453, 21.07662010192871, 22.52062225341797, 23.964624404907227, 25.408626556396484, 26.85262680053711, 28.296628952026367, 29.740631103515625, 31.18463134765625, 32.628631591796875, 34.072635650634766, 35.51663589477539, 36.96063995361328, 38.404640197753906, 39.84864044189453, 41.29264450073242, 42.73664474487305, 44.18064880371094, 45.62464904785156]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 37.0, 32.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 45.0, 76.0, 100.0, 138.0, 287.0, 422.0, 621.0, 975.0, 1593.0, 2414.0, 3662.0, 5509.0, 8398.0, 12881.0, 19744.0, 29915.0, 45489.0, 69748.0, 102557.0, 142764.0, 165714.0, 139976.0, 100131.0, 67459.0, 43936.0, 29116.0, 18868.0, 12353.0, 8225.0, 5373.0, 3490.0, 2308.0, 1507.0, 924.0, 655.0, 433.0, 233.0, 173.0, 115.0, 65.0, 38.0, 25.0, 19.0, 7.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7734375, -0.7496109008789062, -0.7257843017578125, -0.7019577026367188, -0.678131103515625, -0.6543045043945312, -0.6304779052734375, -0.6066513061523438, -0.58282470703125, -0.5589981079101562, -0.5351715087890625, -0.5113449096679688, -0.487518310546875, -0.46369171142578125, -0.4398651123046875, -0.41603851318359375, -0.3922119140625, -0.36838531494140625, -0.3445587158203125, -0.32073211669921875, -0.296905517578125, -0.27307891845703125, -0.2492523193359375, -0.22542572021484375, -0.20159912109375, -0.17777252197265625, -0.1539459228515625, -0.13011932373046875, -0.106292724609375, -0.08246612548828125, -0.0586395263671875, -0.03481292724609375, -0.010986328125, 0.01284027099609375, 0.0366668701171875, 0.06049346923828125, 0.084320068359375, 0.10814666748046875, 0.1319732666015625, 0.15579986572265625, 0.17962646484375, 0.20345306396484375, 0.2272796630859375, 0.25110626220703125, 0.274932861328125, 0.29875946044921875, 0.3225860595703125, 0.34641265869140625, 0.3702392578125, 0.39406585693359375, 0.4178924560546875, 0.44171905517578125, 0.465545654296875, 0.48937225341796875, 0.5131988525390625, 0.5370254516601562, 0.56085205078125, 0.5846786499023438, 0.6085052490234375, 0.6323318481445312, 0.656158447265625, 0.6799850463867188, 0.7038116455078125, 0.7276382446289062, 0.75146484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 14.0, 13.0, 26.0, 22.0, 30.0, 33.0, 30.0, 28.0, 34.0, 40.0, 46.0, 54.0, 47.0, 44.0, 1087.0, 55.0, 54.0, 40.0, 33.0, 46.0, 30.0, 30.0, 29.0, 31.0, 24.0, 17.0, 10.0, 16.0, 13.0, 11.0, 2.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.046875, -6.83404541015625, -6.6212158203125, -6.40838623046875, -6.195556640625, -5.98272705078125, -5.7698974609375, -5.55706787109375, -5.34423828125, -5.13140869140625, -4.9185791015625, -4.70574951171875, -4.492919921875, -4.28009033203125, -4.0672607421875, -3.85443115234375, -3.6416015625, -3.42877197265625, -3.2159423828125, -3.00311279296875, -2.790283203125, -2.57745361328125, -2.3646240234375, -2.15179443359375, -1.93896484375, -1.72613525390625, -1.5133056640625, -1.30047607421875, -1.087646484375, -0.87481689453125, -0.6619873046875, -0.44915771484375, -0.236328125, -0.02349853515625, 0.1893310546875, 0.40216064453125, 0.614990234375, 0.82781982421875, 1.0406494140625, 1.25347900390625, 1.46630859375, 1.67913818359375, 1.8919677734375, 2.10479736328125, 2.317626953125, 2.53045654296875, 2.7432861328125, 2.95611572265625, 3.1689453125, 3.38177490234375, 3.5946044921875, 3.80743408203125, 4.020263671875, 4.23309326171875, 4.4459228515625, 4.65875244140625, 4.87158203125, 5.08441162109375, 5.2972412109375, 5.51007080078125, 5.722900390625, 5.93572998046875, 6.1485595703125, 6.36138916015625, 6.57421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 39.0, 72.0, 74.0, 119.0, 197.0, 319.0, 587.0, 952.0, 1558.0, 2712.0, 4492.0, 7300.0, 12253.0, 20097.0, 33125.0, 53363.0, 84543.0, 127512.0, 233118.0, 1151065.0, 131273.0, 88571.0, 55972.0, 34525.0, 21011.0, 12874.0, 7758.0, 4676.0, 2830.0, 1683.0, 893.0, 634.0, 356.0, 214.0, 140.0, 70.0, 45.0, 35.0, 17.0, 12.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.8037109375, -0.7814178466796875, -0.759124755859375, -0.7368316650390625, -0.71453857421875, -0.6922454833984375, -0.669952392578125, -0.6476593017578125, -0.6253662109375, -0.6030731201171875, -0.580780029296875, -0.5584869384765625, -0.53619384765625, -0.5139007568359375, -0.491607666015625, -0.4693145751953125, -0.447021484375, -0.4247283935546875, -0.402435302734375, -0.3801422119140625, -0.35784912109375, -0.3355560302734375, -0.313262939453125, -0.2909698486328125, -0.2686767578125, -0.2463836669921875, -0.224090576171875, -0.2017974853515625, -0.17950439453125, -0.1572113037109375, -0.134918212890625, -0.1126251220703125, -0.09033203125, -0.0680389404296875, -0.045745849609375, -0.0234527587890625, -0.00115966796875, 0.0211334228515625, 0.043426513671875, 0.0657196044921875, 0.0880126953125, 0.1103057861328125, 0.132598876953125, 0.1548919677734375, 0.17718505859375, 0.1994781494140625, 0.221771240234375, 0.2440643310546875, 0.266357421875, 0.2886505126953125, 0.310943603515625, 0.3332366943359375, 0.35552978515625, 0.3778228759765625, 0.400115966796875, 0.4224090576171875, 0.4447021484375, 0.4669952392578125, 0.489288330078125, 0.5115814208984375, 0.53387451171875, 0.5561676025390625, 0.578460693359375, 0.6007537841796875, 0.623046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 8.0, 25.0, 28.0, 33.0, 50.0, 62.0, 69.0, 90.0, 118.0, 123.0, 79.0, 55.0, 68.0, 50.0, 32.0, 20.0, 14.0, 15.0, 7.0, 5.0, 5.0, 2.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006488800048828125, -0.006296992301940918, -0.006105184555053711, -0.005913376808166504, -0.005721569061279297, -0.00552976131439209, -0.005337953567504883, -0.005146145820617676, -0.004954338073730469, -0.004762530326843262, -0.004570722579956055, -0.004378914833068848, -0.004187107086181641, -0.003995299339294434, -0.0038034915924072266, -0.0036116838455200195, -0.0034198760986328125, -0.0032280683517456055, -0.0030362606048583984, -0.0028444528579711914, -0.0026526451110839844, -0.0024608373641967773, -0.0022690296173095703, -0.0020772218704223633, -0.0018854141235351562, -0.0016936063766479492, -0.0015017986297607422, -0.0013099908828735352, -0.0011181831359863281, -0.0009263753890991211, -0.0007345676422119141, -0.000542759895324707, -0.0003509521484375, -0.00015914440155029297, 3.266334533691406e-05, 0.0002244710922241211, 0.0004162788391113281, 0.0006080865859985352, 0.0007998943328857422, 0.0009917020797729492, 0.0011835098266601562, 0.0013753175735473633, 0.0015671253204345703, 0.0017589330673217773, 0.0019507408142089844, 0.0021425485610961914, 0.0023343563079833984, 0.0025261640548706055, 0.0027179718017578125, 0.0029097795486450195, 0.0031015872955322266, 0.0032933950424194336, 0.0034852027893066406, 0.0036770105361938477, 0.0038688182830810547, 0.004060626029968262, 0.004252433776855469, 0.004444241523742676, 0.004636049270629883, 0.00482785701751709, 0.005019664764404297, 0.005211472511291504, 0.005403280258178711, 0.005595088005065918, 0.005786895751953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 13.0, 10.0, 12.0, 21.0, 30.0, 32.0, 50.0, 78.0, 130.0, 188.0, 325.0, 794.0, 23484.0, 1019948.0, 2174.0, 519.0, 234.0, 156.0, 100.0, 82.0, 44.0, 32.0, 8.0, 12.0, 9.0, 12.0, 3.0, 6.0, 1.0, 5.0, 5.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1087646484375, -0.10517406463623047, -0.10158348083496094, -0.0979928970336914, -0.09440231323242188, -0.09081172943115234, -0.08722114562988281, -0.08363056182861328, -0.08003997802734375, -0.07644939422607422, -0.07285881042480469, -0.06926822662353516, -0.06567764282226562, -0.062087059020996094, -0.05849647521972656, -0.05490589141845703, -0.0513153076171875, -0.04772472381591797, -0.04413414001464844, -0.040543556213378906, -0.036952972412109375, -0.033362388610839844, -0.029771804809570312, -0.02618122100830078, -0.02259063720703125, -0.01900005340576172, -0.015409469604492188, -0.011818885803222656, -0.008228302001953125, -0.004637718200683594, -0.0010471343994140625, 0.0025434494018554688, 0.006134033203125, 0.009724617004394531, 0.013315200805664062, 0.016905784606933594, 0.020496368408203125, 0.024086952209472656, 0.027677536010742188, 0.03126811981201172, 0.03485870361328125, 0.03844928741455078, 0.04203987121582031, 0.045630455017089844, 0.049221038818359375, 0.052811622619628906, 0.05640220642089844, 0.05999279022216797, 0.0635833740234375, 0.06717395782470703, 0.07076454162597656, 0.0743551254272461, 0.07794570922851562, 0.08153629302978516, 0.08512687683105469, 0.08871746063232422, 0.09230804443359375, 0.09589862823486328, 0.09948921203613281, 0.10307979583740234, 0.10667037963867188, 0.1102609634399414, 0.11385154724121094, 0.11744213104248047, 0.12103271484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 63.0, 697.0, 237.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02969544380903244, -0.029085952788591385, -0.02847646363079548, -0.027866972610354424, -0.027257483452558517, -0.026647992432117462, -0.026038503274321556, -0.0254290122538805, -0.024819523096084595, -0.02421003207564354, -0.023600542917847633, -0.022991051897406578, -0.022381562739610672, -0.021772071719169617, -0.02116258256137371, -0.020553091540932655, -0.01994360238313675, -0.019334111362695694, -0.018724622204899788, -0.018115131184458733, -0.017505642026662827, -0.01689615100622177, -0.016286661848425865, -0.01567717082798481, -0.015067679807543755, -0.014458189718425274, -0.013848699629306793, -0.013239209540188313, -0.012629719451069832, -0.012020229361951351, -0.01141073927283287, -0.010801248252391815, -0.010191758163273335, -0.009582268074154854, -0.008972777985036373, -0.008363287895917892, -0.007753797806799412, -0.007144307717680931, -0.006534817162901163, -0.005925327073782682, -0.005315836984664202, -0.004706346895545721, -0.00409685680642724, -0.003487366484478116, -0.0028778763953596354, -0.0022683863062411547, -0.0016588959842920303, -0.0010494058951735497, -0.00043991580605506897, 0.00016957434127107263, 0.0007790644885972142, 0.0013885546941310167, 0.0019980447832494974, 0.002607534872367978, 0.0032170251943171024, 0.003826515283435583, 0.004436005372554064, 0.0050454954616725445, 0.005654985550791025, 0.006264476105570793, 0.006873966194689274, 0.0074834562838077545, 0.008092946372926235, 0.008702436462044716, 0.009311926551163197]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 12.0, 3.0, 7.0, 12.0, 11.0, 8.0, 10.0, 16.0, 16.0, 19.0, 23.0, 25.0, 34.0, 25.0, 31.0, 33.0, 32.0, 38.0, 44.0, 38.0, 46.0, 29.0, 34.0, 43.0, 44.0, 43.0, 35.0, 30.0, 43.0, 33.0, 26.0, 22.0, 21.0, 18.0, 17.0, 16.0, 15.0, 8.0, 6.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020622611045837402, -0.001985718496143818, -0.0019091758877038956, -0.0018326332792639732, -0.001756090670824051, -0.0016795480623841286, -0.0016030054539442062, -0.001526462845504284, -0.0014499202370643616, -0.0013733776286244392, -0.001296835020184517, -0.0012202924117445946, -0.0011437498033046722, -0.00106720719486475, -0.0009906645864248276, -0.0009141219779849052, -0.0008375793695449829, -0.0007610367611050606, -0.0006844941526651382, -0.0006079515442252159, -0.0005314089357852936, -0.00045486632734537125, -0.0003783237189054489, -0.0003017811104655266, -0.00022523850202560425, -0.00014869589358568192, -7.215328514575958e-05, 4.38932329416275e-06, 8.093193173408508e-05, 0.00015747454017400742, 0.00023401714861392975, 0.0003105597570538521, 0.0003871023654937744, 0.00046364497393369675, 0.0005401875823736191, 0.0006167301908135414, 0.0006932727992534637, 0.0007698154076933861, 0.0008463580161333084, 0.0009229006245732307, 0.000999443233013153, 0.0010759858414530754, 0.0011525284498929977, 0.00122907105833292, 0.0013056136667728424, 0.0013821562752127647, 0.001458698883652687, 0.0015352414920926094, 0.0016117841005325317, 0.001688326708972454, 0.0017648693174123764, 0.0018414119258522987, 0.001917954534292221, 0.0019944971427321434, 0.0020710397511720657, 0.002147582359611988, 0.0022241249680519104, 0.0023006675764918327, 0.002377210184931755, 0.0024537527933716774, 0.0025302954018115997, 0.002606838010251522, 0.0026833806186914444, 0.0027599232271313667, 0.002836465835571289]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 36.0, 33.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 9.0, 12.0, 20.0, 24.0, 36.0, 46.0, 63.0, 73.0, 103.0, 152.0, 177.0, 276.0, 378.0, 535.0, 809.0, 1350.0, 2199.0, 4275.0, 8286.0, 17543.0, 39348.0, 94978.0, 310848.0, 370471.0, 111253.0, 44667.0, 19946.0, 9313.0, 4657.0, 2453.0, 1409.0, 865.0, 559.0, 376.0, 250.0, 195.0, 141.0, 96.0, 99.0, 68.0, 59.0, 33.0, 28.0, 19.0, 14.0, 8.0, 11.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.7265625, -9.42333984375, -9.1201171875, -8.81689453125, -8.513671875, -8.21044921875, -7.9072265625, -7.60400390625, -7.30078125, -6.99755859375, -6.6943359375, -6.39111328125, -6.087890625, -5.78466796875, -5.4814453125, -5.17822265625, -4.875, -4.57177734375, -4.2685546875, -3.96533203125, -3.662109375, -3.35888671875, -3.0556640625, -2.75244140625, -2.44921875, -2.14599609375, -1.8427734375, -1.53955078125, -1.236328125, -0.93310546875, -0.6298828125, -0.32666015625, -0.0234375, 0.27978515625, 0.5830078125, 0.88623046875, 1.189453125, 1.49267578125, 1.7958984375, 2.09912109375, 2.40234375, 2.70556640625, 3.0087890625, 3.31201171875, 3.615234375, 3.91845703125, 4.2216796875, 4.52490234375, 4.828125, 5.13134765625, 5.4345703125, 5.73779296875, 6.041015625, 6.34423828125, 6.6474609375, 6.95068359375, 7.25390625, 7.55712890625, 7.8603515625, 8.16357421875, 8.466796875, 8.77001953125, 9.0732421875, 9.37646484375, 9.6796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 5.0, 7.0, 11.0, 17.0, 12.0, 13.0, 24.0, 18.0, 36.0, 35.0, 29.0, 24.0, 49.0, 52.0, 67.0, 80.0, 151.0, 1480.0, 314.0, 124.0, 75.0, 48.0, 40.0, 40.0, 41.0, 33.0, 31.0, 26.0, 24.0, 14.0, 18.0, 24.0, 14.0, 6.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.134521484375, -16.47216796875, -15.809814453125, -15.1474609375, -14.485107421875, -13.82275390625, -13.160400390625, -12.498046875, -11.835693359375, -11.17333984375, -10.510986328125, -9.8486328125, -9.186279296875, -8.52392578125, -7.861572265625, -7.19921875, -6.536865234375, -5.87451171875, -5.212158203125, -4.5498046875, -3.887451171875, -3.22509765625, -2.562744140625, -1.900390625, -1.238037109375, -0.57568359375, 0.086669921875, 0.7490234375, 1.411376953125, 2.07373046875, 2.736083984375, 3.3984375, 4.060791015625, 4.72314453125, 5.385498046875, 6.0478515625, 6.710205078125, 7.37255859375, 8.034912109375, 8.697265625, 9.359619140625, 10.02197265625, 10.684326171875, 11.3466796875, 12.009033203125, 12.67138671875, 13.333740234375, 13.99609375, 14.658447265625, 15.32080078125, 15.983154296875, 16.6455078125, 17.307861328125, 17.97021484375, 18.632568359375, 19.294921875, 19.957275390625, 20.61962890625, 21.281982421875, 21.9443359375, 22.606689453125, 23.26904296875, 23.931396484375, 24.59375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 17.0, 13.0, 21.0, 25.0, 29.0, 41.0, 70.0, 91.0, 165.0, 250.0, 450.0, 1363.0, 18100.0, 2900034.0, 218769.0, 4581.0, 736.0, 316.0, 203.0, 118.0, 72.0, 52.0, 51.0, 39.0, 29.0, 15.0, 11.0, 7.0, 11.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.90625, -41.30419921875, -39.7021484375, -38.10009765625, -36.498046875, -34.89599609375, -33.2939453125, -31.69189453125, -30.08984375, -28.48779296875, -26.8857421875, -25.28369140625, -23.681640625, -22.07958984375, -20.4775390625, -18.87548828125, -17.2734375, -15.67138671875, -14.0693359375, -12.46728515625, -10.865234375, -9.26318359375, -7.6611328125, -6.05908203125, -4.45703125, -2.85498046875, -1.2529296875, 0.34912109375, 1.951171875, 3.55322265625, 5.1552734375, 6.75732421875, 8.359375, 9.96142578125, 11.5634765625, 13.16552734375, 14.767578125, 16.36962890625, 17.9716796875, 19.57373046875, 21.17578125, 22.77783203125, 24.3798828125, 25.98193359375, 27.583984375, 29.18603515625, 30.7880859375, 32.39013671875, 33.9921875, 35.59423828125, 37.1962890625, 38.79833984375, 40.400390625, 42.00244140625, 43.6044921875, 45.20654296875, 46.80859375, 48.41064453125, 50.0126953125, 51.61474609375, 53.216796875, 54.81884765625, 56.4208984375, 58.02294921875, 59.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 33.0, 93.0, 286.0, 353.0, 184.0, 46.0, 14.0, 2.0, 3.0, 1.0], "bins": [-146.693359375, -144.13621520996094, -141.5790557861328, -139.02191162109375, -136.46475219726562, -133.90760803222656, -131.3504638671875, -128.79330444335938, -126.23616027832031, -123.67900848388672, -121.12185668945312, -118.56471252441406, -116.00756072998047, -113.45040893554688, -110.89325714111328, -108.33610534667969, -105.7789535522461, -103.2218017578125, -100.6646499633789, -98.10750579833984, -95.55035400390625, -92.99320220947266, -90.43605041503906, -87.87889862060547, -85.32174682617188, -82.76459503173828, -80.20744323730469, -77.65029907226562, -75.09314727783203, -72.53599548339844, -69.97884368896484, -67.42169189453125, -64.86454010009766, -62.30738830566406, -59.750240325927734, -57.19308853149414, -54.63594055175781, -52.07878875732422, -49.521636962890625, -46.96448516845703, -44.40734100341797, -41.850189208984375, -39.29304122924805, -36.73588943481445, -34.178741455078125, -31.62158966064453, -29.064437866210938, -26.507287979125977, -23.950136184692383, -21.392986297607422, -18.835834503173828, -16.278684616088867, -13.721534729003906, -11.164384841918945, -8.607234001159668, -6.050083160400391, -3.4929332733154297, -0.9357829093933105, 1.6213674545288086, 4.178517818450928, 6.735668182373047, 9.292818069458008, 11.849968910217285, 14.407119750976562, 16.964269638061523]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 11.0, 7.0, 10.0, 9.0, 7.0, 13.0, 16.0, 21.0, 26.0, 25.0, 23.0, 30.0, 40.0, 31.0, 31.0, 37.0, 36.0, 39.0, 47.0, 41.0, 34.0, 41.0, 41.0, 38.0, 31.0, 32.0, 35.0, 33.0, 23.0, 26.0, 23.0, 12.0, 16.0, 14.0, 20.0, 16.0, 8.0, 10.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-48.311767578125, -46.86762237548828, -45.4234733581543, -43.97932434082031, -42.535179138183594, -41.091033935546875, -39.64688491821289, -38.202735900878906, -36.75859069824219, -35.31444549560547, -33.870296478271484, -32.4261474609375, -30.98200225830078, -29.53785514831543, -28.093708038330078, -26.649560928344727, -25.205413818359375, -23.761266708374023, -22.317119598388672, -20.87297248840332, -19.42882537841797, -17.984678268432617, -16.540531158447266, -15.096384048461914, -13.652236938476562, -12.208089828491211, -10.76394271850586, -9.319795608520508, -7.875648498535156, -6.431501388549805, -4.987354278564453, -3.5432071685791016, -2.09906005859375, -0.6549129486083984, 0.7892341613769531, 2.2333812713623047, 3.6775283813476562, 5.121675491333008, 6.565822601318359, 8.009969711303711, 9.454116821289062, 10.898263931274414, 12.342411041259766, 13.786558151245117, 15.230705261230469, 16.67485237121582, 18.118999481201172, 19.563146591186523, 21.007293701171875, 22.451440811157227, 23.895587921142578, 25.33973503112793, 26.78388214111328, 28.228029251098633, 29.672176361083984, 31.116323471069336, 32.56047058105469, 34.004615783691406, 35.44876480102539, 36.892913818359375, 38.337059020996094, 39.78120422363281, 41.2253532409668, 42.66950225830078, 44.1136474609375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 12.0, 11.0, 12.0, 10.0, 3.0, 12.0, 5.0, 21.0, 22.0, 26.0, 30.0, 20.0, 33.0, 39.0, 27.0, 29.0, 38.0, 37.0, 32.0, 42.0, 49.0, 39.0, 54.0, 35.0, 33.0, 31.0, 36.0, 19.0, 29.0, 27.0, 20.0, 18.0, 12.0, 17.0, 16.0, 9.0, 19.0, 9.0, 13.0, 2.0, 6.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.15625, -7.90435791015625, -7.6524658203125, -7.40057373046875, -7.148681640625, -6.89678955078125, -6.6448974609375, -6.39300537109375, -6.14111328125, -5.88922119140625, -5.6373291015625, -5.38543701171875, -5.133544921875, -4.88165283203125, -4.6297607421875, -4.37786865234375, -4.1259765625, -3.87408447265625, -3.6221923828125, -3.37030029296875, -3.118408203125, -2.86651611328125, -2.6146240234375, -2.36273193359375, -2.11083984375, -1.85894775390625, -1.6070556640625, -1.35516357421875, -1.103271484375, -0.85137939453125, -0.5994873046875, -0.34759521484375, -0.095703125, 0.15618896484375, 0.4080810546875, 0.65997314453125, 0.911865234375, 1.16375732421875, 1.4156494140625, 1.66754150390625, 1.91943359375, 2.17132568359375, 2.4232177734375, 2.67510986328125, 2.927001953125, 3.17889404296875, 3.4307861328125, 3.68267822265625, 3.9345703125, 4.18646240234375, 4.4383544921875, 4.69024658203125, 4.942138671875, 5.19403076171875, 5.4459228515625, 5.69781494140625, 5.94970703125, 6.20159912109375, 6.4534912109375, 6.70538330078125, 6.957275390625, 7.20916748046875, 7.4610595703125, 7.71295166015625, 7.96484375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 4.0, 14.0, 14.0, 19.0, 27.0, 44.0, 33.0, 58.0, 73.0, 108.0, 144.0, 179.0, 252.0, 362.0, 416.0, 3142.0, 4176288.0, 11109.0, 553.0, 359.0, 258.0, 198.0, 142.0, 105.0, 76.0, 64.0, 35.0, 42.0, 24.0, 21.0, 21.0, 14.0, 8.0, 9.0, 9.0, 8.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.5, -144.451171875, -139.40234375, -134.353515625, -129.3046875, -124.255859375, -119.20703125, -114.158203125, -109.109375, -104.060546875, -99.01171875, -93.962890625, -88.9140625, -83.865234375, -78.81640625, -73.767578125, -68.71875, -63.669921875, -58.62109375, -53.572265625, -48.5234375, -43.474609375, -38.42578125, -33.376953125, -28.328125, -23.279296875, -18.23046875, -13.181640625, -8.1328125, -3.083984375, 1.96484375, 7.013671875, 12.0625, 17.111328125, 22.16015625, 27.208984375, 32.2578125, 37.306640625, 42.35546875, 47.404296875, 52.453125, 57.501953125, 62.55078125, 67.599609375, 72.6484375, 77.697265625, 82.74609375, 87.794921875, 92.84375, 97.892578125, 102.94140625, 107.990234375, 113.0390625, 118.087890625, 123.13671875, 128.185546875, 133.234375, 138.283203125, 143.33203125, 148.380859375, 153.4296875, 158.478515625, 163.52734375, 168.576171875, 173.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 19.0, 21.0, 24.0, 49.0, 63.0, 94.0, 126.0, 226.0, 384.0, 682.0, 854.0, 585.0, 348.0, 170.0, 129.0, 84.0, 57.0, 32.0, 40.0, 22.0, 12.0, 12.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.990966796875, -18.40380859375, -17.816650390625, -17.2294921875, -16.642333984375, -16.05517578125, -15.468017578125, -14.880859375, -14.293701171875, -13.70654296875, -13.119384765625, -12.5322265625, -11.945068359375, -11.35791015625, -10.770751953125, -10.18359375, -9.596435546875, -9.00927734375, -8.422119140625, -7.8349609375, -7.247802734375, -6.66064453125, -6.073486328125, -5.486328125, -4.899169921875, -4.31201171875, -3.724853515625, -3.1376953125, -2.550537109375, -1.96337890625, -1.376220703125, -0.7890625, -0.201904296875, 0.38525390625, 0.972412109375, 1.5595703125, 2.146728515625, 2.73388671875, 3.321044921875, 3.908203125, 4.495361328125, 5.08251953125, 5.669677734375, 6.2568359375, 6.843994140625, 7.43115234375, 8.018310546875, 8.60546875, 9.192626953125, 9.77978515625, 10.366943359375, 10.9541015625, 11.541259765625, 12.12841796875, 12.715576171875, 13.302734375, 13.889892578125, 14.47705078125, 15.064208984375, 15.6513671875, 16.238525390625, 16.82568359375, 17.412841796875, 18.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 19.0, 16.0, 18.0, 16.0, 16.0, 28.0, 37.0, 45.0, 52.0, 80.0, 148.0, 465.0, 7015.0, 3826648.0, 356646.0, 2273.0, 315.0, 103.0, 51.0, 47.0, 33.0, 37.0, 29.0, 27.0, 19.0, 10.0, 8.0, 12.0, 7.0, 11.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.875, -78.1650390625, -75.455078125, -72.7451171875, -70.03515625, -67.3251953125, -64.615234375, -61.9052734375, -59.1953125, -56.4853515625, -53.775390625, -51.0654296875, -48.35546875, -45.6455078125, -42.935546875, -40.2255859375, -37.515625, -34.8056640625, -32.095703125, -29.3857421875, -26.67578125, -23.9658203125, -21.255859375, -18.5458984375, -15.8359375, -13.1259765625, -10.416015625, -7.7060546875, -4.99609375, -2.2861328125, 0.423828125, 3.1337890625, 5.84375, 8.5537109375, 11.263671875, 13.9736328125, 16.68359375, 19.3935546875, 22.103515625, 24.8134765625, 27.5234375, 30.2333984375, 32.943359375, 35.6533203125, 38.36328125, 41.0732421875, 43.783203125, 46.4931640625, 49.203125, 51.9130859375, 54.623046875, 57.3330078125, 60.04296875, 62.7529296875, 65.462890625, 68.1728515625, 70.8828125, 73.5927734375, 76.302734375, 79.0126953125, 81.72265625, 84.4326171875, 87.142578125, 89.8525390625, 92.5625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 20.0, 52.0, 135.0, 229.0, 230.0, 194.0, 85.0, 50.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.47761535644531, -99.20384216308594, -95.93006896972656, -92.65629577636719, -89.38252258300781, -86.10874938964844, -82.83497619628906, -79.56120300292969, -76.28742980957031, -73.01365661621094, -69.73988342285156, -66.46611022949219, -63.19233703613281, -59.91856384277344, -56.6447868347168, -53.37101364135742, -50.09723663330078, -46.823463439941406, -43.54969024658203, -40.275917053222656, -37.00214385986328, -33.728370666503906, -30.454593658447266, -27.18082046508789, -23.907047271728516, -20.63327407836914, -17.359500885009766, -14.085725784301758, -10.811952590942383, -7.538179397583008, -4.264404296875, -0.990631103515625, 2.2831497192382812, 5.5569233894348145, 8.830697059631348, 12.104471206665039, 15.378244400024414, 18.65201759338379, 21.925792694091797, 25.199565887451172, 28.473339080810547, 31.747112274169922, 35.0208854675293, 38.29466247558594, 41.56843566894531, 44.84220886230469, 48.11598205566406, 51.38975524902344, 54.66352844238281, 57.93730163574219, 61.21107482910156, 64.48484802246094, 67.75862121582031, 71.03239440917969, 74.30616760253906, 77.57994079589844, 80.85371398925781, 84.12748718261719, 87.40126037597656, 90.67503356933594, 93.94880676269531, 97.22257995605469, 100.49635314941406, 103.77012634277344, 107.04390716552734]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 3.0, 4.0, 5.0, 13.0, 13.0, 16.0, 19.0, 17.0, 18.0, 22.0, 23.0, 27.0, 36.0, 42.0, 33.0, 54.0, 41.0, 54.0, 42.0, 42.0, 42.0, 49.0, 51.0, 35.0, 28.0, 31.0, 25.0, 32.0, 24.0, 18.0, 29.0, 15.0, 15.0, 14.0, 15.0, 13.0, 11.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.605979919433594, -45.07762908935547, -43.54928207397461, -42.020931243896484, -40.49258041381836, -38.964229583740234, -37.435882568359375, -35.90753173828125, -34.379180908203125, -32.850830078125, -31.322481155395508, -29.794132232666016, -28.26578140258789, -26.7374324798584, -25.209083557128906, -23.68073272705078, -22.15238380432129, -20.624034881591797, -19.095684051513672, -17.56733512878418, -16.038984298706055, -14.510635375976562, -12.982285499572754, -11.453935623168945, -9.925585746765137, -8.397235870361328, -6.8688859939575195, -5.340536594390869, -3.8121867179870605, -2.283836841583252, -0.7554874420166016, 0.772862434387207, 2.3012123107910156, 3.829562187194824, 5.357912063598633, 6.886261463165283, 8.41461181640625, 9.942960739135742, 11.47131061553955, 12.99966049194336, 14.528010368347168, 16.056360244750977, 17.58470916748047, 19.113059997558594, 20.641408920288086, 22.16975975036621, 23.698108673095703, 25.226459503173828, 26.75480842590332, 28.283157348632812, 29.811508178710938, 31.33985710144043, 32.86820602416992, 34.39655685424805, 35.92490768432617, 37.45325469970703, 38.981605529785156, 40.50995635986328, 42.03830337524414, 43.566654205322266, 45.09500503540039, 46.623355865478516, 48.151702880859375, 49.6800537109375, 51.208404541015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 30.0, 39.0, 56.0, 82.0, 127.0, 220.0, 274.0, 389.0, 586.0, 884.0, 1306.0, 1933.0, 2793.0, 4259.0, 6228.0, 9150.0, 14096.0, 20973.0, 32139.0, 49192.0, 74998.0, 110500.0, 148374.0, 161428.0, 132301.0, 93210.0, 62298.0, 40583.0, 26800.0, 17650.0, 11721.0, 7725.0, 5175.0, 3566.0, 2366.0, 1613.0, 1123.0, 714.0, 519.0, 333.0, 236.0, 159.0, 122.0, 75.0, 51.0, 33.0, 33.0, 15.0, 15.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.72021484375, -0.6971893310546875, -0.674163818359375, -0.6511383056640625, -0.62811279296875, -0.6050872802734375, -0.582061767578125, -0.5590362548828125, -0.5360107421875, -0.5129852294921875, -0.489959716796875, -0.4669342041015625, -0.44390869140625, -0.4208831787109375, -0.397857666015625, -0.3748321533203125, -0.351806640625, -0.3287811279296875, -0.305755615234375, -0.2827301025390625, -0.25970458984375, -0.2366790771484375, -0.213653564453125, -0.1906280517578125, -0.1676025390625, -0.1445770263671875, -0.121551513671875, -0.0985260009765625, -0.07550048828125, -0.0524749755859375, -0.029449462890625, -0.0064239501953125, 0.0166015625, 0.0396270751953125, 0.062652587890625, 0.0856781005859375, 0.10870361328125, 0.1317291259765625, 0.154754638671875, 0.1777801513671875, 0.2008056640625, 0.2238311767578125, 0.246856689453125, 0.2698822021484375, 0.29290771484375, 0.3159332275390625, 0.338958740234375, 0.3619842529296875, 0.385009765625, 0.4080352783203125, 0.431060791015625, 0.4540863037109375, 0.47711181640625, 0.5001373291015625, 0.523162841796875, 0.5461883544921875, 0.5692138671875, 0.5922393798828125, 0.615264892578125, 0.6382904052734375, 0.66131591796875, 0.6843414306640625, 0.707366943359375, 0.7303924560546875, 0.75341796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 16.0, 19.0, 18.0, 24.0, 19.0, 33.0, 43.0, 40.0, 38.0, 46.0, 46.0, 36.0, 52.0, 1063.0, 61.0, 42.0, 44.0, 33.0, 38.0, 34.0, 36.0, 33.0, 24.0, 24.0, 23.0, 18.0, 13.0, 11.0, 10.0, 8.0, 2.0, 11.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-7.29296875, -7.09478759765625, -6.8966064453125, -6.69842529296875, -6.500244140625, -6.30206298828125, -6.1038818359375, -5.90570068359375, -5.70751953125, -5.50933837890625, -5.3111572265625, -5.11297607421875, -4.914794921875, -4.71661376953125, -4.5184326171875, -4.32025146484375, -4.1220703125, -3.92388916015625, -3.7257080078125, -3.52752685546875, -3.329345703125, -3.13116455078125, -2.9329833984375, -2.73480224609375, -2.53662109375, -2.33843994140625, -2.1402587890625, -1.94207763671875, -1.743896484375, -1.54571533203125, -1.3475341796875, -1.14935302734375, -0.951171875, -0.75299072265625, -0.5548095703125, -0.35662841796875, -0.158447265625, 0.03973388671875, 0.2379150390625, 0.43609619140625, 0.63427734375, 0.83245849609375, 1.0306396484375, 1.22882080078125, 1.427001953125, 1.62518310546875, 1.8233642578125, 2.02154541015625, 2.2197265625, 2.41790771484375, 2.6160888671875, 2.81427001953125, 3.012451171875, 3.21063232421875, 3.4088134765625, 3.60699462890625, 3.80517578125, 4.00335693359375, 4.2015380859375, 4.39971923828125, 4.597900390625, 4.79608154296875, 4.9942626953125, 5.19244384765625, 5.390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 22.0, 29.0, 42.0, 91.0, 137.0, 201.0, 328.0, 559.0, 882.0, 1479.0, 2350.0, 3786.0, 6270.0, 9840.0, 15555.0, 24569.0, 38407.0, 60681.0, 92453.0, 130781.0, 1206477.0, 158106.0, 118844.0, 81881.0, 52651.0, 33791.0, 21154.0, 13419.0, 8306.0, 5426.0, 3288.0, 2038.0, 1281.0, 754.0, 502.0, 286.0, 173.0, 115.0, 61.0, 37.0, 26.0, 11.0, 11.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6257095336914062, -0.6054229736328125, -0.5851364135742188, -0.564849853515625, -0.5445632934570312, -0.5242767333984375, -0.5039901733398438, -0.48370361328125, -0.46341705322265625, -0.4431304931640625, -0.42284393310546875, -0.402557373046875, -0.38227081298828125, -0.3619842529296875, -0.34169769287109375, -0.3214111328125, -0.30112457275390625, -0.2808380126953125, -0.26055145263671875, -0.240264892578125, -0.21997833251953125, -0.1996917724609375, -0.17940521240234375, -0.15911865234375, -0.13883209228515625, -0.1185455322265625, -0.09825897216796875, -0.077972412109375, -0.05768585205078125, -0.0373992919921875, -0.01711273193359375, 0.003173828125, 0.02346038818359375, 0.0437469482421875, 0.06403350830078125, 0.084320068359375, 0.10460662841796875, 0.1248931884765625, 0.14517974853515625, 0.16546630859375, 0.18575286865234375, 0.2060394287109375, 0.22632598876953125, 0.246612548828125, 0.26689910888671875, 0.2871856689453125, 0.30747222900390625, 0.3277587890625, 0.34804534912109375, 0.3683319091796875, 0.38861846923828125, 0.408905029296875, 0.42919158935546875, 0.4494781494140625, 0.46976470947265625, 0.49005126953125, 0.5103378295898438, 0.5306243896484375, 0.5509109497070312, 0.571197509765625, 0.5914840698242188, 0.6117706298828125, 0.6320571899414062, 0.65234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 4.0, 3.0, 11.0, 10.0, 12.0, 18.0, 9.0, 18.0, 20.0, 31.0, 33.0, 29.0, 35.0, 27.0, 53.0, 62.0, 59.0, 60.0, 64.0, 53.0, 68.0, 44.0, 38.0, 43.0, 22.0, 26.0, 21.0, 22.0, 18.0, 6.0, 14.0, 8.0, 8.0, 4.0, 1.0, 9.0, 4.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0036296844482421875, -0.0035242438316345215, -0.0034188032150268555, -0.0033133625984191895, -0.0032079219818115234, -0.0031024813652038574, -0.0029970407485961914, -0.0028916001319885254, -0.0027861595153808594, -0.0026807188987731934, -0.0025752782821655273, -0.0024698376655578613, -0.0023643970489501953, -0.0022589564323425293, -0.0021535158157348633, -0.0020480751991271973, -0.0019426345825195312, -0.0018371939659118652, -0.0017317533493041992, -0.0016263127326965332, -0.0015208721160888672, -0.0014154314994812012, -0.0013099908828735352, -0.0012045502662658691, -0.0010991096496582031, -0.0009936690330505371, -0.0008882284164428711, -0.0007827877998352051, -0.0006773471832275391, -0.000571906566619873, -0.00046646595001220703, -0.000361025333404541, -0.000255584716796875, -0.00015014410018920898, -4.470348358154297e-05, 6.073713302612305e-05, 0.00016617774963378906, 0.0002716183662414551, 0.0003770589828491211, 0.0004824995994567871, 0.0005879402160644531, 0.0006933808326721191, 0.0007988214492797852, 0.0009042620658874512, 0.0010097026824951172, 0.0011151432991027832, 0.0012205839157104492, 0.0013260245323181152, 0.0014314651489257812, 0.0015369057655334473, 0.0016423463821411133, 0.0017477869987487793, 0.0018532276153564453, 0.0019586682319641113, 0.0020641088485717773, 0.0021695494651794434, 0.0022749900817871094, 0.0023804306983947754, 0.0024858713150024414, 0.0025913119316101074, 0.0026967525482177734, 0.0028021931648254395, 0.0029076337814331055, 0.0030130743980407715, 0.0031185150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 12.0, 6.0, 8.0, 9.0, 16.0, 17.0, 16.0, 28.0, 49.0, 58.0, 60.0, 95.0, 118.0, 143.0, 209.0, 380.0, 636.0, 2082.0, 183891.0, 852706.0, 5818.0, 755.0, 423.0, 270.0, 159.0, 107.0, 98.0, 68.0, 53.0, 43.0, 32.0, 34.0, 27.0, 18.0, 19.0, 12.0, 8.0, 13.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05596590042114258, -0.053978919982910156, -0.051991939544677734, -0.05000495910644531, -0.04801797866821289, -0.04603099822998047, -0.04404401779174805, -0.042057037353515625, -0.0400700569152832, -0.03808307647705078, -0.03609609603881836, -0.03410911560058594, -0.032122135162353516, -0.030135154724121094, -0.028148174285888672, -0.02616119384765625, -0.024174213409423828, -0.022187232971191406, -0.020200252532958984, -0.018213272094726562, -0.01622629165649414, -0.014239311218261719, -0.012252330780029297, -0.010265350341796875, -0.008278369903564453, -0.006291389465332031, -0.004304409027099609, -0.0023174285888671875, -0.0003304481506347656, 0.0016565322875976562, 0.003643512725830078, 0.0056304931640625, 0.007617473602294922, 0.009604454040527344, 0.011591434478759766, 0.013578414916992188, 0.01556539535522461, 0.01755237579345703, 0.019539356231689453, 0.021526336669921875, 0.023513317108154297, 0.02550029754638672, 0.02748727798461914, 0.029474258422851562, 0.031461238861083984, 0.033448219299316406, 0.03543519973754883, 0.03742218017578125, 0.03940916061401367, 0.041396141052246094, 0.043383121490478516, 0.04537010192871094, 0.04735708236694336, 0.04934406280517578, 0.0513310432434082, 0.053318023681640625, 0.05530500411987305, 0.05729198455810547, 0.05927896499633789, 0.06126594543457031, 0.06325292587280273, 0.06523990631103516, 0.06722688674926758, 0.0692138671875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 56.0, 357.0, 415.0, 129.0, 36.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01804562658071518, -0.01769249700009823, -0.017339367419481277, -0.016986237838864326, -0.016633108258247375, -0.016279976814985275, -0.015926849097013474, -0.015573718585073948, -0.015220588073134422, -0.014867458492517471, -0.01451432891190052, -0.01416119933128357, -0.013808068819344044, -0.013454939238727093, -0.013101809658110142, -0.01274868007749319, -0.01239555049687624, -0.012042420916259289, -0.011689291335642338, -0.011336160823702812, -0.010983031243085861, -0.01062990166246891, -0.01027677208185196, -0.009923642501235008, -0.009570512920618057, -0.009217383340001106, -0.008864253759384155, -0.008511124178767204, -0.008157993666827679, -0.007804864086210728, -0.007451734505593777, -0.007098604924976826, -0.006745473947376013, -0.006392344366759062, -0.0060392143204808235, -0.0056860847398638725, -0.0053329551592469215, -0.004979825112968683, -0.004626695532351732, -0.004273565486073494, -0.003920435905456543, -0.0035673060920089483, -0.0032141762785613537, -0.0028610466979444027, -0.002507916884496808, -0.0021547870710492134, -0.0018016574904322624, -0.0014485276769846678, -0.0010953978635370731, -0.0007422681082971394, -0.0003891383530572057, -3.600865602493286e-05, 0.0003171211574226618, 0.0006702509708702564, 0.0010233805514872074, 0.001376510364934802, 0.0017296401783823967, 0.0020827699918299913, 0.002435899805277586, 0.002789029385894537, 0.0031421591993421316, 0.0034952890127897263, 0.0038484185934066772, 0.004201548174023628, 0.0045546782203018665]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 5.0, 11.0, 15.0, 14.0, 21.0, 15.0, 14.0, 27.0, 10.0, 33.0, 30.0, 29.0, 33.0, 33.0, 23.0, 48.0, 34.0, 39.0, 34.0, 33.0, 35.0, 34.0, 36.0, 44.0, 38.0, 36.0, 25.0, 30.0, 20.0, 20.0, 24.0, 24.0, 15.0, 18.0, 18.0, 11.0, 8.0, 11.0, 5.0, 2.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0018517374992370605, -0.0017941063269972801, -0.0017364751547574997, -0.0016788439825177193, -0.0016212128102779388, -0.0015635816380381584, -0.001505950465798378, -0.0014483192935585976, -0.0013906881213188171, -0.0013330569490790367, -0.0012754257768392563, -0.0012177946045994759, -0.0011601634323596954, -0.001102532260119915, -0.0010449010878801346, -0.0009872699156403542, -0.0009296387434005737, -0.0008720075711607933, -0.0008143763989210129, -0.0007567452266812325, -0.000699114054441452, -0.0006414828822016716, -0.0005838517099618912, -0.0005262205377221107, -0.0004685893654823303, -0.0004109581932425499, -0.00035332702100276947, -0.00029569584876298904, -0.00023806467652320862, -0.0001804335042834282, -0.00012280233204364777, -6.517115980386734e-05, -7.539987564086914e-06, 5.009118467569351e-05, 0.00010772235691547394, 0.00016535352915525436, 0.0002229847013950348, 0.0002806158736348152, 0.00033824704587459564, 0.00039587821811437607, 0.0004535093903541565, 0.0005111405625939369, 0.0005687717348337173, 0.0006264029070734978, 0.0006840340793132782, 0.0007416652515530586, 0.000799296423792839, 0.0008569275960326195, 0.0009145587682723999, 0.0009721899405121803, 0.0010298211127519608, 0.0010874522849917412, 0.0011450834572315216, 0.001202714629471302, 0.0012603458017110825, 0.0013179769739508629, 0.0013756081461906433, 0.0014332393184304237, 0.0014908704906702042, 0.0015485016629099846, 0.001606132835149765, 0.0016637640073895454, 0.0017213951796293259, 0.0017790263518691063, 0.0018366575241088867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 5.0, 15.0, 12.0, 19.0, 19.0, 20.0, 41.0, 50.0, 81.0, 95.0, 148.0, 188.0, 222.0, 262.0, 406.0, 609.0, 756.0, 1159.0, 1853.0, 3643.0, 9085.0, 31994.0, 156486.0, 578455.0, 201604.0, 40311.0, 10594.0, 4043.0, 1997.0, 1270.0, 838.0, 623.0, 433.0, 282.0, 213.0, 177.0, 128.0, 104.0, 86.0, 54.0, 40.0, 35.0, 23.0, 21.0, 8.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.359375, -14.8729248046875, -14.386474609375, -13.9000244140625, -13.41357421875, -12.9271240234375, -12.440673828125, -11.9542236328125, -11.4677734375, -10.9813232421875, -10.494873046875, -10.0084228515625, -9.52197265625, -9.0355224609375, -8.549072265625, -8.0626220703125, -7.576171875, -7.0897216796875, -6.603271484375, -6.1168212890625, -5.63037109375, -5.1439208984375, -4.657470703125, -4.1710205078125, -3.6845703125, -3.1981201171875, -2.711669921875, -2.2252197265625, -1.73876953125, -1.2523193359375, -0.765869140625, -0.2794189453125, 0.20703125, 0.6934814453125, 1.179931640625, 1.6663818359375, 2.15283203125, 2.6392822265625, 3.125732421875, 3.6121826171875, 4.0986328125, 4.5850830078125, 5.071533203125, 5.5579833984375, 6.04443359375, 6.5308837890625, 7.017333984375, 7.5037841796875, 7.990234375, 8.4766845703125, 8.963134765625, 9.4495849609375, 9.93603515625, 10.4224853515625, 10.908935546875, 11.3953857421875, 11.8818359375, 12.3682861328125, 12.854736328125, 13.3411865234375, 13.82763671875, 14.3140869140625, 14.800537109375, 15.2869873046875, 15.7734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 15.0, 5.0, 16.0, 17.0, 25.0, 23.0, 37.0, 34.0, 46.0, 34.0, 66.0, 83.0, 163.0, 1496.0, 371.0, 123.0, 64.0, 53.0, 46.0, 40.0, 28.0, 29.0, 31.0, 33.0, 26.0, 20.0, 21.0, 12.0, 11.0, 12.0, 5.0, 7.0, 10.0, 11.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.28076171875, -20.5927734375, -19.90478515625, -19.216796875, -18.52880859375, -17.8408203125, -17.15283203125, -16.46484375, -15.77685546875, -15.0888671875, -14.40087890625, -13.712890625, -13.02490234375, -12.3369140625, -11.64892578125, -10.9609375, -10.27294921875, -9.5849609375, -8.89697265625, -8.208984375, -7.52099609375, -6.8330078125, -6.14501953125, -5.45703125, -4.76904296875, -4.0810546875, -3.39306640625, -2.705078125, -2.01708984375, -1.3291015625, -0.64111328125, 0.046875, 0.73486328125, 1.4228515625, 2.11083984375, 2.798828125, 3.48681640625, 4.1748046875, 4.86279296875, 5.55078125, 6.23876953125, 6.9267578125, 7.61474609375, 8.302734375, 8.99072265625, 9.6787109375, 10.36669921875, 11.0546875, 11.74267578125, 12.4306640625, 13.11865234375, 13.806640625, 14.49462890625, 15.1826171875, 15.87060546875, 16.55859375, 17.24658203125, 17.9345703125, 18.62255859375, 19.310546875, 19.99853515625, 20.6865234375, 21.37451171875, 22.0625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 6.0, 0.0, 6.0, 7.0, 10.0, 7.0, 12.0, 15.0, 12.0, 29.0, 20.0, 34.0, 33.0, 54.0, 83.0, 131.0, 203.0, 407.0, 788.0, 3044.0, 3091129.0, 47132.0, 1279.0, 506.0, 275.0, 138.0, 102.0, 61.0, 37.0, 38.0, 19.0, 23.0, 11.0, 9.0, 9.0, 5.0, 2.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-102.3125, -99.6015625, -96.890625, -94.1796875, -91.46875, -88.7578125, -86.046875, -83.3359375, -80.625, -77.9140625, -75.203125, -72.4921875, -69.78125, -67.0703125, -64.359375, -61.6484375, -58.9375, -56.2265625, -53.515625, -50.8046875, -48.09375, -45.3828125, -42.671875, -39.9609375, -37.25, -34.5390625, -31.828125, -29.1171875, -26.40625, -23.6953125, -20.984375, -18.2734375, -15.5625, -12.8515625, -10.140625, -7.4296875, -4.71875, -2.0078125, 0.703125, 3.4140625, 6.125, 8.8359375, 11.546875, 14.2578125, 16.96875, 19.6796875, 22.390625, 25.1015625, 27.8125, 30.5234375, 33.234375, 35.9453125, 38.65625, 41.3671875, 44.078125, 46.7890625, 49.5, 52.2109375, 54.921875, 57.6328125, 60.34375, 63.0546875, 65.765625, 68.4765625, 71.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 597.0, 395.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.3544921875, -212.21298217773438, -202.07147216796875, -191.92994689941406, -181.78843688964844, -171.6469268798828, -161.50540161132812, -151.3638916015625, -141.22238159179688, -131.08087158203125, -120.9393539428711, -110.79783630371094, -100.65632629394531, -90.51481628417969, -80.37329864501953, -70.23178100585938, -60.09027099609375, -49.94875717163086, -39.80724334716797, -29.665729522705078, -19.524215698242188, -9.382701873779297, 0.7588119506835938, 10.90032958984375, 21.041839599609375, 31.183353424072266, 41.324867248535156, 51.46638107299805, 61.60789489746094, 71.74940490722656, 81.89092254638672, 92.03244018554688, 102.1739501953125, 112.31546020507812, 122.45697784423828, 132.59849548339844, 142.74000549316406, 152.8815155029297, 163.02304077148438, 173.16455078125, 183.30606079101562, 193.44757080078125, 203.58908081054688, 213.73060607910156, 223.8721160888672, 234.0136260986328, 244.1551513671875, 254.29666137695312, 264.43817138671875, 274.5796813964844, 284.72119140625, 294.8627014160156, 305.00421142578125, 315.145751953125, 325.2872619628906, 335.42877197265625, 345.5702819824219, 355.7117919921875, 365.8533020019531, 375.99481201171875, 386.1363525390625, 396.2778625488281, 406.41937255859375, 416.5608825683594, 426.702392578125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 12.0, 5.0, 9.0, 8.0, 16.0, 16.0, 21.0, 15.0, 22.0, 26.0, 29.0, 32.0, 28.0, 28.0, 40.0, 32.0, 44.0, 41.0, 39.0, 35.0, 47.0, 47.0, 38.0, 50.0, 40.0, 29.0, 33.0, 32.0, 18.0, 27.0, 21.0, 26.0, 6.0, 6.0, 11.0, 21.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.22264862060547, -57.51224899291992, -55.80184555053711, -54.09144592285156, -52.381046295166016, -50.67064666748047, -48.960243225097656, -47.24984359741211, -45.53944396972656, -43.829044342041016, -42.1186408996582, -40.408241271972656, -38.69784164428711, -36.98744201660156, -35.27703857421875, -33.5666389465332, -31.856237411499023, -30.145835876464844, -28.435436248779297, -26.725034713745117, -25.01463508605957, -23.30423355102539, -21.593833923339844, -19.883432388305664, -18.173030853271484, -16.462629318237305, -14.752229690551758, -13.041828155517578, -11.331428527832031, -9.621026992797852, -7.910626411437988, -6.200225830078125, -4.489826202392578, -2.779425621032715, -1.0690248012542725, 0.6413760185241699, 2.351776599884033, 4.062177658081055, 5.772578239440918, 7.482978820800781, 9.193379402160645, 10.903779983520508, 12.614180564880371, 14.324581146240234, 16.034982681274414, 17.745384216308594, 19.45578384399414, 21.166183471679688, 22.876585006713867, 24.586986541748047, 26.297386169433594, 28.007787704467773, 29.71818733215332, 31.4285888671875, 33.13898849487305, 34.849388122558594, 36.559791564941406, 38.27019119262695, 39.980594635009766, 41.69099426269531, 43.40139389038086, 45.111793518066406, 46.82219696044922, 48.532596588134766, 50.24299621582031]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 8.0, 6.0, 5.0, 13.0, 13.0, 19.0, 21.0, 32.0, 28.0, 30.0, 30.0, 38.0, 35.0, 46.0, 37.0, 38.0, 50.0, 43.0, 47.0, 40.0, 43.0, 40.0, 42.0, 38.0, 28.0, 34.0, 27.0, 22.0, 22.0, 33.0, 14.0, 10.0, 14.0, 9.0, 4.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6092529296875, -8.312255859375, -8.0152587890625, -7.71826171875, -7.4212646484375, -7.124267578125, -6.8272705078125, -6.5302734375, -6.2332763671875, -5.936279296875, -5.6392822265625, -5.34228515625, -5.0452880859375, -4.748291015625, -4.4512939453125, -4.154296875, -3.8572998046875, -3.560302734375, -3.2633056640625, -2.96630859375, -2.6693115234375, -2.372314453125, -2.0753173828125, -1.7783203125, -1.4813232421875, -1.184326171875, -0.8873291015625, -0.59033203125, -0.2933349609375, 0.003662109375, 0.3006591796875, 0.59765625, 0.8946533203125, 1.191650390625, 1.4886474609375, 1.78564453125, 2.0826416015625, 2.379638671875, 2.6766357421875, 2.9736328125, 3.2706298828125, 3.567626953125, 3.8646240234375, 4.16162109375, 4.4586181640625, 4.755615234375, 5.0526123046875, 5.349609375, 5.6466064453125, 5.943603515625, 6.2406005859375, 6.53759765625, 6.8345947265625, 7.131591796875, 7.4285888671875, 7.7255859375, 8.0225830078125, 8.319580078125, 8.6165771484375, 8.91357421875, 9.2105712890625, 9.507568359375, 9.8045654296875, 10.1015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 18.0, 21.0, 23.0, 34.0, 35.0, 45.0, 73.0, 86.0, 114.0, 167.0, 271.0, 416.0, 731.0, 1479.0, 3544.0, 9594.0, 43353.0, 379417.0, 2308499.0, 1278850.0, 136095.0, 20314.0, 5980.0, 2284.0, 1134.0, 566.0, 320.0, 221.0, 135.0, 111.0, 76.0, 57.0, 49.0, 33.0, 26.0, 18.0, 19.0, 10.0, 10.0, 8.0, 3.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.96875, -17.420654296875, -16.87255859375, -16.324462890625, -15.7763671875, -15.228271484375, -14.68017578125, -14.132080078125, -13.583984375, -13.035888671875, -12.48779296875, -11.939697265625, -11.3916015625, -10.843505859375, -10.29541015625, -9.747314453125, -9.19921875, -8.651123046875, -8.10302734375, -7.554931640625, -7.0068359375, -6.458740234375, -5.91064453125, -5.362548828125, -4.814453125, -4.266357421875, -3.71826171875, -3.170166015625, -2.6220703125, -2.073974609375, -1.52587890625, -0.977783203125, -0.4296875, 0.118408203125, 0.66650390625, 1.214599609375, 1.7626953125, 2.310791015625, 2.85888671875, 3.406982421875, 3.955078125, 4.503173828125, 5.05126953125, 5.599365234375, 6.1474609375, 6.695556640625, 7.24365234375, 7.791748046875, 8.33984375, 8.887939453125, 9.43603515625, 9.984130859375, 10.5322265625, 11.080322265625, 11.62841796875, 12.176513671875, 12.724609375, 13.272705078125, 13.82080078125, 14.368896484375, 14.9169921875, 15.465087890625, 16.01318359375, 16.561279296875, 17.109375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 23.0, 33.0, 38.0, 66.0, 97.0, 134.0, 191.0, 237.0, 504.0, 648.0, 675.0, 433.0, 292.0, 190.0, 141.0, 105.0, 64.0, 48.0, 35.0, 23.0, 20.0, 22.0, 10.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.03125, -23.4305419921875, -22.829833984375, -22.2291259765625, -21.62841796875, -21.0277099609375, -20.427001953125, -19.8262939453125, -19.2255859375, -18.6248779296875, -18.024169921875, -17.4234619140625, -16.82275390625, -16.2220458984375, -15.621337890625, -15.0206298828125, -14.419921875, -13.8192138671875, -13.218505859375, -12.6177978515625, -12.01708984375, -11.4163818359375, -10.815673828125, -10.2149658203125, -9.6142578125, -9.0135498046875, -8.412841796875, -7.8121337890625, -7.21142578125, -6.6107177734375, -6.010009765625, -5.4093017578125, -4.80859375, -4.2078857421875, -3.607177734375, -3.0064697265625, -2.40576171875, -1.8050537109375, -1.204345703125, -0.6036376953125, -0.0029296875, 0.5977783203125, 1.198486328125, 1.7991943359375, 2.39990234375, 3.0006103515625, 3.601318359375, 4.2020263671875, 4.802734375, 5.4034423828125, 6.004150390625, 6.6048583984375, 7.20556640625, 7.8062744140625, 8.406982421875, 9.0076904296875, 9.6083984375, 10.2091064453125, 10.809814453125, 11.4105224609375, 12.01123046875, 12.6119384765625, 13.212646484375, 13.8133544921875, 14.4140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 8.0, 13.0, 17.0, 40.0, 69.0, 100.0, 177.0, 423.0, 799.0, 2374.0, 15468.0, 619857.0, 3490822.0, 57609.0, 4299.0, 1219.0, 461.0, 225.0, 130.0, 67.0, 45.0, 23.0, 7.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -42.00830078125, -40.7041015625, -39.39990234375, -38.095703125, -36.79150390625, -35.4873046875, -34.18310546875, -32.87890625, -31.57470703125, -30.2705078125, -28.96630859375, -27.662109375, -26.35791015625, -25.0537109375, -23.74951171875, -22.4453125, -21.14111328125, -19.8369140625, -18.53271484375, -17.228515625, -15.92431640625, -14.6201171875, -13.31591796875, -12.01171875, -10.70751953125, -9.4033203125, -8.09912109375, -6.794921875, -5.49072265625, -4.1865234375, -2.88232421875, -1.578125, -0.27392578125, 1.0302734375, 2.33447265625, 3.638671875, 4.94287109375, 6.2470703125, 7.55126953125, 8.85546875, 10.15966796875, 11.4638671875, 12.76806640625, 14.072265625, 15.37646484375, 16.6806640625, 17.98486328125, 19.2890625, 20.59326171875, 21.8974609375, 23.20166015625, 24.505859375, 25.81005859375, 27.1142578125, 28.41845703125, 29.72265625, 31.02685546875, 32.3310546875, 33.63525390625, 34.939453125, 36.24365234375, 37.5478515625, 38.85205078125, 40.15625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 70.0, 849.0, 93.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-848.4249267578125, -831.959228515625, -815.4935302734375, -799.02783203125, -782.5621337890625, -766.096435546875, -749.6307373046875, -733.1650390625, -716.6993408203125, -700.233642578125, -683.7679443359375, -667.30224609375, -650.8365478515625, -634.370849609375, -617.9051513671875, -601.439453125, -584.9736938476562, -568.5079956054688, -552.0422973632812, -535.5765991210938, -519.1109008789062, -502.64520263671875, -486.1794738769531, -469.7137756347656, -453.2480773925781, -436.7823791503906, -420.3166809082031, -403.8509826660156, -387.38525390625, -370.9195556640625, -354.453857421875, -337.9881591796875, -321.5224609375, -305.0567626953125, -288.591064453125, -272.1253662109375, -255.65965270996094, -239.19395446777344, -222.72824096679688, -206.26254272460938, -189.79684448242188, -173.33114624023438, -156.86544799804688, -140.3997344970703, -123.93403625488281, -107.46833801269531, -91.00263214111328, -74.53692626953125, -58.07122802734375, -41.605525970458984, -25.13982391357422, -8.674121856689453, 7.7915802001953125, 24.257278442382812, 40.722984313964844, 57.188690185546875, 73.65438842773438, 90.12008666992188, 106.5857925415039, 123.05149841308594, 139.51719665527344, 155.98289489746094, 172.4486083984375, 188.914306640625, 205.3800048828125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 5.0, 13.0, 16.0, 18.0, 16.0, 18.0, 28.0, 23.0, 28.0, 38.0, 39.0, 37.0, 37.0, 37.0, 40.0, 39.0, 47.0, 52.0, 46.0, 37.0, 32.0, 46.0, 38.0, 39.0, 37.0, 24.0, 25.0, 23.0, 21.0, 16.0, 20.0, 7.0, 7.0, 12.0, 9.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-54.67823028564453, -52.84877395629883, -51.01932144165039, -49.18986511230469, -47.360408782958984, -45.53095626831055, -43.701499938964844, -41.872047424316406, -40.0425910949707, -38.213134765625, -36.38368225097656, -34.55422592163086, -32.724769592285156, -30.89531707763672, -29.065860748291016, -27.236406326293945, -25.406949996948242, -23.577495574951172, -21.74803924560547, -19.9185848236084, -18.089130401611328, -16.259674072265625, -14.430219650268555, -12.600765228271484, -10.771309852600098, -8.941854476928711, -7.112400054931641, -5.282944679260254, -3.4534897804260254, -1.6240348815917969, 0.20542049407958984, 2.03487491607666, 3.864330291748047, 5.693785190582275, 7.523240089416504, 9.35269546508789, 11.182149887084961, 13.011605262756348, 14.841060638427734, 16.670515060424805, 18.499969482421875, 20.329423904418945, 22.15888023376465, 23.98833465576172, 25.81778907775879, 27.64724349975586, 29.476699829101562, 31.306154251098633, 33.13561248779297, 34.96506881713867, 36.79452133178711, 38.62397766113281, 40.453433990478516, 42.28288650512695, 44.112342834472656, 45.941795349121094, 47.7712516784668, 49.6007080078125, 51.43016052246094, 53.25961685180664, 55.089073181152344, 56.91852569580078, 58.747982025146484, 60.57743835449219, 62.406890869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 15.0, 24.0, 15.0, 21.0, 32.0, 26.0, 40.0, 36.0, 43.0, 28.0, 43.0, 41.0, 33.0, 41.0, 31.0, 45.0, 53.0, 46.0, 33.0, 43.0, 41.0, 24.0, 37.0, 40.0, 22.0, 17.0, 14.0, 12.0, 13.0, 11.0, 11.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.3929443359375, -6.160888671875, -5.9288330078125, -5.69677734375, -5.4647216796875, -5.232666015625, -5.0006103515625, -4.7685546875, -4.5364990234375, -4.304443359375, -4.0723876953125, -3.84033203125, -3.6082763671875, -3.376220703125, -3.1441650390625, -2.912109375, -2.6800537109375, -2.447998046875, -2.2159423828125, -1.98388671875, -1.7518310546875, -1.519775390625, -1.2877197265625, -1.0556640625, -0.8236083984375, -0.591552734375, -0.3594970703125, -0.12744140625, 0.1046142578125, 0.336669921875, 0.5687255859375, 0.80078125, 1.0328369140625, 1.264892578125, 1.4969482421875, 1.72900390625, 1.9610595703125, 2.193115234375, 2.4251708984375, 2.6572265625, 2.8892822265625, 3.121337890625, 3.3533935546875, 3.58544921875, 3.8175048828125, 4.049560546875, 4.2816162109375, 4.513671875, 4.7457275390625, 4.977783203125, 5.2098388671875, 5.44189453125, 5.6739501953125, 5.906005859375, 6.1380615234375, 6.3701171875, 6.6021728515625, 6.834228515625, 7.0662841796875, 7.29833984375, 7.5303955078125, 7.762451171875, 7.9945068359375, 8.2265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 19.0, 29.0, 36.0, 53.0, 76.0, 143.0, 215.0, 320.0, 550.0, 879.0, 1376.0, 2149.0, 3522.0, 5771.0, 9553.0, 15674.0, 26178.0, 44056.0, 74336.0, 122980.0, 186681.0, 199791.0, 140671.0, 86098.0, 50774.0, 30443.0, 17992.0, 10947.0, 6560.0, 4122.0, 2444.0, 1525.0, 984.0, 573.0, 333.0, 249.0, 143.0, 108.0, 63.0, 43.0, 28.0, 19.0, 13.0, 11.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7138900756835938, -0.6909637451171875, -0.6680374145507812, -0.645111083984375, -0.6221847534179688, -0.5992584228515625, -0.5763320922851562, -0.55340576171875, -0.5304794311523438, -0.5075531005859375, -0.48462677001953125, -0.461700439453125, -0.43877410888671875, -0.4158477783203125, -0.39292144775390625, -0.3699951171875, -0.34706878662109375, -0.3241424560546875, -0.30121612548828125, -0.278289794921875, -0.25536346435546875, -0.2324371337890625, -0.20951080322265625, -0.18658447265625, -0.16365814208984375, -0.1407318115234375, -0.11780548095703125, -0.094879150390625, -0.07195281982421875, -0.0490264892578125, -0.02610015869140625, -0.003173828125, 0.01975250244140625, 0.0426788330078125, 0.06560516357421875, 0.088531494140625, 0.11145782470703125, 0.1343841552734375, 0.15731048583984375, 0.18023681640625, 0.20316314697265625, 0.2260894775390625, 0.24901580810546875, 0.271942138671875, 0.29486846923828125, 0.3177947998046875, 0.34072113037109375, 0.3636474609375, 0.38657379150390625, 0.4095001220703125, 0.43242645263671875, 0.455352783203125, 0.47827911376953125, 0.5012054443359375, 0.5241317749023438, 0.54705810546875, 0.5699844360351562, 0.5929107666015625, 0.6158370971679688, 0.638763427734375, 0.6616897583007812, 0.6846160888671875, 0.7075424194335938, 0.73046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 0.0, 6.0, 7.0, 9.0, 13.0, 13.0, 13.0, 19.0, 29.0, 23.0, 30.0, 27.0, 27.0, 31.0, 38.0, 23.0, 36.0, 47.0, 43.0, 44.0, 1066.0, 40.0, 36.0, 44.0, 30.0, 45.0, 27.0, 37.0, 26.0, 30.0, 16.0, 23.0, 24.0, 19.0, 15.0, 10.0, 17.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9837646484375, -3.842529296875, -3.7012939453125, -3.56005859375, -3.4188232421875, -3.277587890625, -3.1363525390625, -2.9951171875, -2.8538818359375, -2.712646484375, -2.5714111328125, -2.43017578125, -2.2889404296875, -2.147705078125, -2.0064697265625, -1.865234375, -1.7239990234375, -1.582763671875, -1.4415283203125, -1.30029296875, -1.1590576171875, -1.017822265625, -0.8765869140625, -0.7353515625, -0.5941162109375, -0.452880859375, -0.3116455078125, -0.17041015625, -0.0291748046875, 0.112060546875, 0.2532958984375, 0.39453125, 0.5357666015625, 0.677001953125, 0.8182373046875, 0.95947265625, 1.1007080078125, 1.241943359375, 1.3831787109375, 1.5244140625, 1.6656494140625, 1.806884765625, 1.9481201171875, 2.08935546875, 2.2305908203125, 2.371826171875, 2.5130615234375, 2.654296875, 2.7955322265625, 2.936767578125, 3.0780029296875, 3.21923828125, 3.3604736328125, 3.501708984375, 3.6429443359375, 3.7841796875, 3.9254150390625, 4.066650390625, 4.2078857421875, 4.34912109375, 4.4903564453125, 4.631591796875, 4.7728271484375, 4.9140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 20.0, 15.0, 27.0, 38.0, 97.0, 124.0, 206.0, 362.0, 588.0, 976.0, 1532.0, 2561.0, 4113.0, 6887.0, 11023.0, 17610.0, 28208.0, 44353.0, 70664.0, 105537.0, 146669.0, 1215288.0, 146113.0, 105757.0, 69751.0, 45004.0, 27754.0, 17322.0, 11172.0, 6693.0, 4189.0, 2581.0, 1546.0, 913.0, 575.0, 351.0, 192.0, 118.0, 68.0, 41.0, 28.0, 27.0, 17.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.59619140625, -0.5793952941894531, -0.5625991821289062, -0.5458030700683594, -0.5290069580078125, -0.5122108459472656, -0.49541473388671875, -0.4786186218261719, -0.461822509765625, -0.4450263977050781, -0.42823028564453125, -0.4114341735839844, -0.3946380615234375, -0.3778419494628906, -0.36104583740234375, -0.3442497253417969, -0.32745361328125, -0.3106575012207031, -0.29386138916015625, -0.2770652770996094, -0.2602691650390625, -0.24347305297851562, -0.22667694091796875, -0.20988082885742188, -0.193084716796875, -0.17628860473632812, -0.15949249267578125, -0.14269638061523438, -0.1259002685546875, -0.10910415649414062, -0.09230804443359375, -0.07551193237304688, -0.0587158203125, -0.041919708251953125, -0.02512359619140625, -0.008327484130859375, 0.0084686279296875, 0.025264739990234375, 0.04206085205078125, 0.058856964111328125, 0.075653076171875, 0.09244918823242188, 0.10924530029296875, 0.12604141235351562, 0.1428375244140625, 0.15963363647460938, 0.17642974853515625, 0.19322586059570312, 0.21002197265625, 0.22681808471679688, 0.24361419677734375, 0.2604103088378906, 0.2772064208984375, 0.2940025329589844, 0.31079864501953125, 0.3275947570800781, 0.344390869140625, 0.3611869812011719, 0.37798309326171875, 0.3947792053222656, 0.4115753173828125, 0.4283714294433594, 0.44516754150390625, 0.4619636535644531, 0.478759765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 8.0, 8.0, 9.0, 17.0, 16.0, 20.0, 26.0, 24.0, 22.0, 36.0, 36.0, 39.0, 58.0, 44.0, 46.0, 50.0, 39.0, 36.0, 50.0, 43.0, 46.0, 47.0, 33.0, 39.0, 34.0, 30.0, 22.0, 20.0, 15.0, 14.0, 17.0, 14.0, 10.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002166748046875, -0.0020940005779266357, -0.0020212531089782715, -0.0019485056400299072, -0.001875758171081543, -0.0018030107021331787, -0.0017302632331848145, -0.0016575157642364502, -0.001584768295288086, -0.0015120208263397217, -0.0014392733573913574, -0.0013665258884429932, -0.001293778419494629, -0.0012210309505462646, -0.0011482834815979004, -0.0010755360126495361, -0.0010027885437011719, -0.0009300410747528076, -0.0008572936058044434, -0.0007845461368560791, -0.0007117986679077148, -0.0006390511989593506, -0.0005663037300109863, -0.0004935562610626221, -0.0004208087921142578, -0.00034806132316589355, -0.0002753138542175293, -0.00020256638526916504, -0.00012981891632080078, -5.7071447372436523e-05, 1.5676021575927734e-05, 8.842349052429199e-05, 0.00016117095947265625, 0.0002339184284210205, 0.00030666589736938477, 0.000379413366317749, 0.0004521608352661133, 0.0005249083042144775, 0.0005976557731628418, 0.0006704032421112061, 0.0007431507110595703, 0.0008158981800079346, 0.0008886456489562988, 0.0009613931179046631, 0.0010341405868530273, 0.0011068880558013916, 0.0011796355247497559, 0.0012523829936981201, 0.0013251304626464844, 0.0013978779315948486, 0.0014706254005432129, 0.0015433728694915771, 0.0016161203384399414, 0.0016888678073883057, 0.00176161527633667, 0.0018343627452850342, 0.0019071102142333984, 0.0019798576831817627, 0.002052605152130127, 0.002125352621078491, 0.0021981000900268555, 0.0022708475589752197, 0.002343595027923584, 0.0024163424968719482, 0.0024890899658203125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 20.0, 19.0, 26.0, 26.0, 44.0, 40.0, 67.0, 73.0, 117.0, 158.0, 236.0, 308.0, 559.0, 1183.0, 60846.0, 975846.0, 6702.0, 783.0, 492.0, 289.0, 176.0, 137.0, 89.0, 74.0, 53.0, 50.0, 28.0, 28.0, 12.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.06341552734375, -0.06175994873046875, -0.0601043701171875, -0.05844879150390625, -0.056793212890625, -0.05513763427734375, -0.0534820556640625, -0.05182647705078125, -0.0501708984375, -0.04851531982421875, -0.0468597412109375, -0.04520416259765625, -0.043548583984375, -0.04189300537109375, -0.0402374267578125, -0.03858184814453125, -0.03692626953125, -0.03527069091796875, -0.0336151123046875, -0.03195953369140625, -0.030303955078125, -0.02864837646484375, -0.0269927978515625, -0.02533721923828125, -0.023681640625, -0.02202606201171875, -0.0203704833984375, -0.01871490478515625, -0.017059326171875, -0.01540374755859375, -0.0137481689453125, -0.01209259033203125, -0.01043701171875, -0.00878143310546875, -0.0071258544921875, -0.00547027587890625, -0.003814697265625, -0.00215911865234375, -0.0005035400390625, 0.00115203857421875, 0.0028076171875, 0.00446319580078125, 0.0061187744140625, 0.00777435302734375, 0.009429931640625, 0.01108551025390625, 0.0127410888671875, 0.01439666748046875, 0.01605224609375, 0.01770782470703125, 0.0193634033203125, 0.02101898193359375, 0.022674560546875, 0.02433013916015625, 0.0259857177734375, 0.02764129638671875, 0.029296875, 0.03095245361328125, 0.0326080322265625, 0.03426361083984375, 0.035919189453125, 0.03757476806640625, 0.0392303466796875, 0.04088592529296875, 0.04254150390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 524.0, 468.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03573993593454361, -0.035077761858701706, -0.0344155915081501, -0.0337534174323082, -0.03309124708175659, -0.03242907300591469, -0.03176690265536308, -0.03110472857952118, -0.030442556366324425, -0.02978038415312767, -0.029118211939930916, -0.02845603972673416, -0.027793865650892258, -0.027131693437695503, -0.02646952122449875, -0.025807349011301994, -0.02514517679810524, -0.024483004584908485, -0.02382083237171173, -0.023158660158514977, -0.022496487945318222, -0.02183431386947632, -0.021172141656279564, -0.02050996944308281, -0.019847797229886055, -0.0191856250166893, -0.018523452803492546, -0.01786128059029579, -0.017199106514453888, -0.016536934301257133, -0.01587476208806038, -0.015212589874863625, -0.01455041766166687, -0.013888245448470116, -0.013226073235273361, -0.012563900090754032, -0.011901727877557278, -0.011239555664360523, -0.010577382519841194, -0.00991521030664444, -0.009253038093447685, -0.00859086588025093, -0.007928693667054176, -0.007266520522534847, -0.006604348309338093, -0.005942176096141338, -0.005280003417283297, -0.004617830738425255, -0.0039556585252285, -0.0032934860792011023, -0.002631313633173704, -0.001969141187146306, -0.001306968741118908, -0.0006447962950915098, 1.737615093588829e-05, 0.00067954882979393, 0.0013417210429906845, 0.0020038934890180826, 0.0026660659350454807, 0.003328238381072879, 0.003990410827100277, 0.004652583040297031, 0.005314755719155073, 0.005976928398013115, 0.006639100611209869]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 6.0, 16.0, 11.0, 16.0, 20.0, 24.0, 32.0, 26.0, 34.0, 37.0, 40.0, 43.0, 44.0, 39.0, 45.0, 44.0, 57.0, 27.0, 49.0, 51.0, 40.0, 32.0, 36.0, 26.0, 39.0, 29.0, 24.0, 17.0, 15.0, 11.0, 12.0, 15.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015895962715148926, -0.001541762612760067, -0.0014939289540052414, -0.0014460952952504158, -0.0013982616364955902, -0.0013504279777407646, -0.001302594318985939, -0.0012547606602311134, -0.0012069270014762878, -0.0011590933427214622, -0.0011112596839666367, -0.001063426025211811, -0.0010155923664569855, -0.0009677587077021599, -0.0009199250489473343, -0.0008720913901925087, -0.0008242577314376831, -0.0007764240726828575, -0.0007285904139280319, -0.0006807567551732063, -0.0006329230964183807, -0.0005850894376635551, -0.0005372557789087296, -0.000489422120153904, -0.00044158846139907837, -0.0003937548026442528, -0.0003459211438894272, -0.0002980874851346016, -0.000250253826379776, -0.0002024201676249504, -0.00015458650887012482, -0.00010675285011529922, -5.891919136047363e-05, -1.108553260564804e-05, 3.674812614917755e-05, 8.458178490400314e-05, 0.00013241544365882874, 0.00018024910241365433, 0.00022808276116847992, 0.0002759164199233055, 0.0003237500786781311, 0.0003715837374329567, 0.0004194173961877823, 0.0004672510549426079, 0.0005150847136974335, 0.0005629183724522591, 0.0006107520312070847, 0.0006585856899619102, 0.0007064193487167358, 0.0007542530074715614, 0.000802086666226387, 0.0008499203249812126, 0.0008977539837360382, 0.0009455876424908638, 0.0009934213012456894, 0.001041254960000515, 0.0010890886187553406, 0.0011369222775101662, 0.0011847559362649918, 0.0012325895950198174, 0.001280423253774643, 0.0013282569125294685, 0.0013760905712842941, 0.0014239242300391197, 0.0014717578887939453]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 10.0, 15.0, 25.0, 15.0, 20.0, 32.0, 26.0, 40.0, 38.0, 41.0, 30.0, 42.0, 41.0, 33.0, 41.0, 30.0, 45.0, 53.0, 46.0, 35.0, 42.0, 41.0, 23.0, 38.0, 39.0, 22.0, 17.0, 14.0, 12.0, 13.0, 12.0, 10.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.38909912109375, -6.1571044921875, -5.92510986328125, -5.693115234375, -5.46112060546875, -5.2291259765625, -4.99713134765625, -4.76513671875, -4.53314208984375, -4.3011474609375, -4.06915283203125, -3.837158203125, -3.60516357421875, -3.3731689453125, -3.14117431640625, -2.9091796875, -2.67718505859375, -2.4451904296875, -2.21319580078125, -1.981201171875, -1.74920654296875, -1.5172119140625, -1.28521728515625, -1.05322265625, -0.82122802734375, -0.5892333984375, -0.35723876953125, -0.125244140625, 0.10675048828125, 0.3387451171875, 0.57073974609375, 0.802734375, 1.03472900390625, 1.2667236328125, 1.49871826171875, 1.730712890625, 1.96270751953125, 2.1947021484375, 2.42669677734375, 2.65869140625, 2.89068603515625, 3.1226806640625, 3.35467529296875, 3.586669921875, 3.81866455078125, 4.0506591796875, 4.28265380859375, 4.5146484375, 4.74664306640625, 4.9786376953125, 5.21063232421875, 5.442626953125, 5.67462158203125, 5.9066162109375, 6.13861083984375, 6.37060546875, 6.60260009765625, 6.8345947265625, 7.06658935546875, 7.298583984375, 7.53057861328125, 7.7625732421875, 7.99456787109375, 8.2265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 13.0, 9.0, 21.0, 21.0, 39.0, 40.0, 46.0, 70.0, 117.0, 148.0, 238.0, 379.0, 467.0, 710.0, 1119.0, 1819.0, 3093.0, 6273.0, 18845.0, 153711.0, 733705.0, 99624.0, 15065.0, 5263.0, 2838.0, 1631.0, 1017.0, 646.0, 532.0, 312.0, 218.0, 154.0, 98.0, 59.0, 69.0, 39.0, 33.0, 26.0, 10.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.390625, -20.78662109375, -20.1826171875, -19.57861328125, -18.974609375, -18.37060546875, -17.7666015625, -17.16259765625, -16.55859375, -15.95458984375, -15.3505859375, -14.74658203125, -14.142578125, -13.53857421875, -12.9345703125, -12.33056640625, -11.7265625, -11.12255859375, -10.5185546875, -9.91455078125, -9.310546875, -8.70654296875, -8.1025390625, -7.49853515625, -6.89453125, -6.29052734375, -5.6865234375, -5.08251953125, -4.478515625, -3.87451171875, -3.2705078125, -2.66650390625, -2.0625, -1.45849609375, -0.8544921875, -0.25048828125, 0.353515625, 0.95751953125, 1.5615234375, 2.16552734375, 2.76953125, 3.37353515625, 3.9775390625, 4.58154296875, 5.185546875, 5.78955078125, 6.3935546875, 6.99755859375, 7.6015625, 8.20556640625, 8.8095703125, 9.41357421875, 10.017578125, 10.62158203125, 11.2255859375, 11.82958984375, 12.43359375, 13.03759765625, 13.6416015625, 14.24560546875, 14.849609375, 15.45361328125, 16.0576171875, 16.66162109375, 17.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 4.0, 5.0, 15.0, 9.0, 15.0, 12.0, 21.0, 21.0, 18.0, 22.0, 35.0, 30.0, 37.0, 46.0, 65.0, 77.0, 123.0, 358.0, 1522.0, 186.0, 67.0, 45.0, 49.0, 32.0, 35.0, 30.0, 25.0, 22.0, 15.0, 13.0, 13.0, 13.0, 7.0, 10.0, 9.0, 2.0, 7.0, 6.0, 2.0, 2.0, 9.0, 2.0, 2.0, 2.0], "bins": [-21.671875, -21.1038818359375, -20.535888671875, -19.9678955078125, -19.39990234375, -18.8319091796875, -18.263916015625, -17.6959228515625, -17.1279296875, -16.5599365234375, -15.991943359375, -15.4239501953125, -14.85595703125, -14.2879638671875, -13.719970703125, -13.1519775390625, -12.583984375, -12.0159912109375, -11.447998046875, -10.8800048828125, -10.31201171875, -9.7440185546875, -9.176025390625, -8.6080322265625, -8.0400390625, -7.4720458984375, -6.904052734375, -6.3360595703125, -5.76806640625, -5.2000732421875, -4.632080078125, -4.0640869140625, -3.49609375, -2.9281005859375, -2.360107421875, -1.7921142578125, -1.22412109375, -0.6561279296875, -0.088134765625, 0.4798583984375, 1.0478515625, 1.6158447265625, 2.183837890625, 2.7518310546875, 3.31982421875, 3.8878173828125, 4.455810546875, 5.0238037109375, 5.591796875, 6.1597900390625, 6.727783203125, 7.2957763671875, 7.86376953125, 8.4317626953125, 8.999755859375, 9.5677490234375, 10.1357421875, 10.7037353515625, 11.271728515625, 11.8397216796875, 12.40771484375, 12.9757080078125, 13.543701171875, 14.1116943359375, 14.6796875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 29.0, 37.0, 42.0, 59.0, 86.0, 138.0, 227.0, 448.0, 1158.0, 21152.0, 3116365.0, 4051.0, 794.0, 375.0, 221.0, 135.0, 93.0, 77.0, 44.0, 29.0, 14.0, 13.0, 15.0, 12.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.8125, -76.58203125, -74.3515625, -72.12109375, -69.890625, -67.66015625, -65.4296875, -63.19921875, -60.96875, -58.73828125, -56.5078125, -54.27734375, -52.046875, -49.81640625, -47.5859375, -45.35546875, -43.125, -40.89453125, -38.6640625, -36.43359375, -34.203125, -31.97265625, -29.7421875, -27.51171875, -25.28125, -23.05078125, -20.8203125, -18.58984375, -16.359375, -14.12890625, -11.8984375, -9.66796875, -7.4375, -5.20703125, -2.9765625, -0.74609375, 1.484375, 3.71484375, 5.9453125, 8.17578125, 10.40625, 12.63671875, 14.8671875, 17.09765625, 19.328125, 21.55859375, 23.7890625, 26.01953125, 28.25, 30.48046875, 32.7109375, 34.94140625, 37.171875, 39.40234375, 41.6328125, 43.86328125, 46.09375, 48.32421875, 50.5546875, 52.78515625, 55.015625, 57.24609375, 59.4765625, 61.70703125, 63.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 88.0, 374.0, 434.0, 97.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.78763580322266, -111.15155792236328, -106.51548767089844, -101.87940979003906, -97.24333190917969, -92.60725402832031, -87.97117614746094, -83.3351058959961, -78.69902801513672, -74.06295013427734, -69.4268798828125, -64.79080200195312, -60.15472412109375, -55.518646240234375, -50.882572174072266, -46.246498107910156, -41.61042022705078, -36.974342346191406, -32.3382682800293, -27.702192306518555, -23.066116333007812, -18.43004035949707, -13.793964385986328, -9.157890319824219, -4.521812438964844, 0.11426353454589844, 4.750339508056641, 9.386415481567383, 14.022491455078125, 18.658567428588867, 23.29464340209961, 27.93071746826172, 32.56678771972656, 37.20286560058594, 41.83893966674805, 46.475013732910156, 51.11109161376953, 55.747169494628906, 60.383243560791016, 65.01931762695312, 69.6553955078125, 74.29147338867188, 78.92755126953125, 83.5636215209961, 88.19969940185547, 92.83577728271484, 97.47184753417969, 102.10792541503906, 106.74400329589844, 111.38008117675781, 116.01615905761719, 120.65222930908203, 125.2883071899414, 129.92437744140625, 134.56045532226562, 139.196533203125, 143.83261108398438, 148.46868896484375, 153.10476684570312, 157.7408447265625, 162.37692260742188, 167.0129852294922, 171.64906311035156, 176.28514099121094, 180.9212188720703]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 20.0, 22.0, 24.0, 26.0, 23.0, 41.0, 29.0, 26.0, 34.0, 24.0, 28.0, 43.0, 40.0, 43.0, 41.0, 32.0, 32.0, 40.0, 36.0, 37.0, 21.0, 29.0, 27.0, 16.0, 28.0, 20.0, 24.0, 20.0, 17.0, 7.0, 13.0, 4.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0], "bins": [-44.91546630859375, -43.57817840576172, -42.24089050292969, -40.903602600097656, -39.56631088256836, -38.22902297973633, -36.8917350769043, -35.554447174072266, -34.217159271240234, -32.8798713684082, -31.54258155822754, -30.205293655395508, -28.868005752563477, -27.530715942382812, -26.19342803955078, -24.85614013671875, -23.518850326538086, -22.181562423706055, -20.84427261352539, -19.50698471069336, -18.169696807861328, -16.832408905029297, -15.495119094848633, -14.157831192016602, -12.820542335510254, -11.483253479003906, -10.145965576171875, -8.808676719665527, -7.471388339996338, -6.134099960327148, -4.796811103820801, -3.4595232009887695, -2.122234344482422, -0.7849458456039429, 0.5523426532745361, 1.8896312713623047, 3.226919651031494, 4.564208030700684, 5.901496887207031, 7.2387847900390625, 8.57607364654541, 9.913362503051758, 11.250650405883789, 12.587939262390137, 13.925228118896484, 15.262516021728516, 16.599803924560547, 17.937091827392578, 19.274381637573242, 20.611669540405273, 21.948959350585938, 23.28624725341797, 24.62353515625, 25.96082305908203, 27.298112869262695, 28.635400772094727, 29.97269058227539, 31.309978485107422, 32.64726638793945, 33.98455810546875, 35.32184600830078, 36.65913391113281, 37.996421813964844, 39.333709716796875, 40.670997619628906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 8.0, 10.0, 13.0, 9.0, 12.0, 27.0, 17.0, 21.0, 20.0, 32.0, 27.0, 37.0, 30.0, 29.0, 23.0, 45.0, 37.0, 50.0, 52.0, 30.0, 44.0, 43.0, 43.0, 29.0, 30.0, 32.0, 24.0, 32.0, 20.0, 24.0, 26.0, 18.0, 14.0, 14.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.58984375, -6.369140625, -6.1484375, -5.927734375, -5.70703125, -5.486328125, -5.265625, -5.044921875, -4.82421875, -4.603515625, -4.3828125, -4.162109375, -3.94140625, -3.720703125, -3.5, -3.279296875, -3.05859375, -2.837890625, -2.6171875, -2.396484375, -2.17578125, -1.955078125, -1.734375, -1.513671875, -1.29296875, -1.072265625, -0.8515625, -0.630859375, -0.41015625, -0.189453125, 0.03125, 0.251953125, 0.47265625, 0.693359375, 0.9140625, 1.134765625, 1.35546875, 1.576171875, 1.796875, 2.017578125, 2.23828125, 2.458984375, 2.6796875, 2.900390625, 3.12109375, 3.341796875, 3.5625, 3.783203125, 4.00390625, 4.224609375, 4.4453125, 4.666015625, 4.88671875, 5.107421875, 5.328125, 5.548828125, 5.76953125, 5.990234375, 6.2109375, 6.431640625, 6.65234375, 6.873046875, 7.09375, 7.314453125, 7.53515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 18.0, 18.0, 30.0, 26.0, 31.0, 45.0, 71.0, 68.0, 102.0, 126.0, 178.0, 269.0, 333.0, 514.0, 737.0, 1216.0, 2095.0, 4366.0, 11827.0, 69532.0, 790289.0, 2655722.0, 590392.0, 46702.0, 9946.0, 3952.0, 2065.0, 1168.0, 725.0, 462.0, 316.0, 213.0, 172.0, 116.0, 110.0, 79.0, 54.0, 51.0, 25.0, 33.0, 18.0, 15.0, 10.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.2734375, -13.804443359375, -13.33544921875, -12.866455078125, -12.3974609375, -11.928466796875, -11.45947265625, -10.990478515625, -10.521484375, -10.052490234375, -9.58349609375, -9.114501953125, -8.6455078125, -8.176513671875, -7.70751953125, -7.238525390625, -6.76953125, -6.300537109375, -5.83154296875, -5.362548828125, -4.8935546875, -4.424560546875, -3.95556640625, -3.486572265625, -3.017578125, -2.548583984375, -2.07958984375, -1.610595703125, -1.1416015625, -0.672607421875, -0.20361328125, 0.265380859375, 0.734375, 1.203369140625, 1.67236328125, 2.141357421875, 2.6103515625, 3.079345703125, 3.54833984375, 4.017333984375, 4.486328125, 4.955322265625, 5.42431640625, 5.893310546875, 6.3623046875, 6.831298828125, 7.30029296875, 7.769287109375, 8.23828125, 8.707275390625, 9.17626953125, 9.645263671875, 10.1142578125, 10.583251953125, 11.05224609375, 11.521240234375, 11.990234375, 12.459228515625, 12.92822265625, 13.397216796875, 13.8662109375, 14.335205078125, 14.80419921875, 15.273193359375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 13.0, 19.0, 29.0, 48.0, 79.0, 122.0, 205.0, 314.0, 537.0, 774.0, 718.0, 454.0, 310.0, 184.0, 113.0, 59.0, 32.0, 18.0, 16.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.7659912109375, -13.164794921875, -12.5635986328125, -11.96240234375, -11.3612060546875, -10.760009765625, -10.1588134765625, -9.5576171875, -8.9564208984375, -8.355224609375, -7.7540283203125, -7.15283203125, -6.5516357421875, -5.950439453125, -5.3492431640625, -4.748046875, -4.1468505859375, -3.545654296875, -2.9444580078125, -2.34326171875, -1.7420654296875, -1.140869140625, -0.5396728515625, 0.0615234375, 0.6627197265625, 1.263916015625, 1.8651123046875, 2.46630859375, 3.0675048828125, 3.668701171875, 4.2698974609375, 4.87109375, 5.4722900390625, 6.073486328125, 6.6746826171875, 7.27587890625, 7.8770751953125, 8.478271484375, 9.0794677734375, 9.6806640625, 10.2818603515625, 10.883056640625, 11.4842529296875, 12.08544921875, 12.6866455078125, 13.287841796875, 13.8890380859375, 14.490234375, 15.0914306640625, 15.692626953125, 16.2938232421875, 16.89501953125, 17.4962158203125, 18.097412109375, 18.6986083984375, 19.2998046875, 19.9010009765625, 20.502197265625, 21.1033935546875, 21.70458984375, 22.3057861328125, 22.906982421875, 23.5081787109375, 24.109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 15.0, 20.0, 31.0, 37.0, 85.0, 144.0, 321.0, 704.0, 2021.0, 18326.0, 3935917.0, 230169.0, 4321.0, 1166.0, 472.0, 229.0, 123.0, 77.0, 26.0, 24.0, 18.0, 2.0, 7.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-56.5625, -55.173828125, -53.78515625, -52.396484375, -51.0078125, -49.619140625, -48.23046875, -46.841796875, -45.453125, -44.064453125, -42.67578125, -41.287109375, -39.8984375, -38.509765625, -37.12109375, -35.732421875, -34.34375, -32.955078125, -31.56640625, -30.177734375, -28.7890625, -27.400390625, -26.01171875, -24.623046875, -23.234375, -21.845703125, -20.45703125, -19.068359375, -17.6796875, -16.291015625, -14.90234375, -13.513671875, -12.125, -10.736328125, -9.34765625, -7.958984375, -6.5703125, -5.181640625, -3.79296875, -2.404296875, -1.015625, 0.373046875, 1.76171875, 3.150390625, 4.5390625, 5.927734375, 7.31640625, 8.705078125, 10.09375, 11.482421875, 12.87109375, 14.259765625, 15.6484375, 17.037109375, 18.42578125, 19.814453125, 21.203125, 22.591796875, 23.98046875, 25.369140625, 26.7578125, 28.146484375, 29.53515625, 30.923828125, 32.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 25.0, 137.0, 277.0, 355.0, 164.0, 39.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.05208587646484, -66.65472412109375, -62.257362365722656, -57.86000061035156, -53.46263885498047, -49.065277099609375, -44.66791915893555, -40.27055740356445, -35.87319564819336, -31.475833892822266, -27.078472137451172, -22.68111228942871, -18.283750534057617, -13.886388778686523, -9.489028930664062, -5.091667175292969, -0.694305419921875, 3.7030558586120605, 8.100417137145996, 12.497777938842773, 16.895139694213867, 21.29250144958496, 25.689861297607422, 30.087223052978516, 34.48458480834961, 38.8819465637207, 43.2793083190918, 47.676666259765625, 52.07402801513672, 56.47138977050781, 60.868751525878906, 65.26611328125, 69.66348266601562, 74.06084442138672, 78.45820617675781, 82.8555679321289, 87.2529296875, 91.6502914428711, 96.04765319824219, 100.44500732421875, 104.84237670898438, 109.23973846435547, 113.63710021972656, 118.03446197509766, 122.43182373046875, 126.82918548583984, 131.22654724121094, 135.6239013671875, 140.02127075195312, 144.4186248779297, 148.8159942626953, 153.21334838867188, 157.6107177734375, 162.00807189941406, 166.4054412841797, 170.80279541015625, 175.2001495361328, 179.59750366210938, 183.994873046875, 188.39222717285156, 192.7895965576172, 197.18695068359375, 201.58432006835938, 205.98167419433594, 210.37904357910156]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 5.0, 14.0, 15.0, 11.0, 12.0, 20.0, 22.0, 29.0, 25.0, 22.0, 29.0, 33.0, 36.0, 24.0, 30.0, 44.0, 40.0, 42.0, 46.0, 47.0, 32.0, 42.0, 38.0, 29.0, 35.0, 32.0, 24.0, 28.0, 18.0, 18.0, 27.0, 13.0, 21.0, 13.0, 11.0, 12.0, 14.0, 4.0, 4.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-42.887542724609375, -41.56871795654297, -40.24989318847656, -38.93106460571289, -37.612239837646484, -36.29341506958008, -34.97459030151367, -33.655765533447266, -32.336936950683594, -31.018112182617188, -29.69928550720215, -28.380460739135742, -27.061634063720703, -25.742809295654297, -24.42398452758789, -23.105159759521484, -21.786334991455078, -20.467510223388672, -19.148683547973633, -17.829858779907227, -16.511032104492188, -15.192207336425781, -13.873382568359375, -12.554556846618652, -11.23573112487793, -9.916905403137207, -8.598079681396484, -7.279254913330078, -5.9604291915893555, -4.641603469848633, -3.3227782249450684, -2.003952980041504, -0.6851272583007812, 0.6336982250213623, 1.9525237083435059, 3.2713491916656494, 4.590174674987793, 5.909000396728516, 7.22782564163208, 8.546650886535645, 9.865476608276367, 11.18430233001709, 12.503128051757812, 13.821952819824219, 15.140778541564941, 16.459604263305664, 17.77842903137207, 19.09725570678711, 20.416080474853516, 21.734905242919922, 23.05373191833496, 24.372556686401367, 25.691383361816406, 27.010208129882812, 28.32903289794922, 29.647857666015625, 30.966684341430664, 32.2855110168457, 33.60433578491211, 34.923160552978516, 36.24198532104492, 37.560813903808594, 38.879638671875, 40.198463439941406, 41.51728820800781]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 38.0, 37.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 26.0, 18.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 23.0, 39.0, 60.0, 87.0, 128.0, 216.0, 280.0, 388.0, 570.0, 807.0, 1218.0, 1748.0, 2287.0, 3431.0, 5201.0, 7592.0, 11584.0, 17279.0, 26939.0, 42103.0, 63906.0, 96468.0, 136084.0, 163773.0, 146855.0, 108526.0, 72287.0, 47569.0, 30928.0, 19825.0, 13106.0, 8751.0, 5846.0, 3980.0, 2644.0, 1849.0, 1323.0, 829.0, 641.0, 433.0, 307.0, 215.0, 134.0, 104.0, 68.0, 32.0, 28.0, 15.0, 10.0, 9.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.446533203125, -0.4319648742675781, -0.41739654541015625, -0.4028282165527344, -0.3882598876953125, -0.3736915588378906, -0.35912322998046875, -0.3445549011230469, -0.329986572265625, -0.3154182434082031, -0.30084991455078125, -0.2862815856933594, -0.2717132568359375, -0.2571449279785156, -0.24257659912109375, -0.22800827026367188, -0.21343994140625, -0.19887161254882812, -0.18430328369140625, -0.16973495483398438, -0.1551666259765625, -0.14059829711914062, -0.12602996826171875, -0.11146163940429688, -0.096893310546875, -0.08232498168945312, -0.06775665283203125, -0.053188323974609375, -0.0386199951171875, -0.024051666259765625, -0.00948333740234375, 0.005084991455078125, 0.0196533203125, 0.034221649169921875, 0.04878997802734375, 0.06335830688476562, 0.0779266357421875, 0.09249496459960938, 0.10706329345703125, 0.12163162231445312, 0.136199951171875, 0.15076828002929688, 0.16533660888671875, 0.17990493774414062, 0.1944732666015625, 0.20904159545898438, 0.22360992431640625, 0.23817825317382812, 0.25274658203125, 0.2673149108886719, 0.28188323974609375, 0.2964515686035156, 0.3110198974609375, 0.3255882263183594, 0.34015655517578125, 0.3547248840332031, 0.369293212890625, 0.3838615417480469, 0.39842987060546875, 0.4129981994628906, 0.4275665283203125, 0.4421348571777344, 0.45670318603515625, 0.4712715148925781, 0.48583984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 5.0, 7.0, 13.0, 6.0, 6.0, 7.0, 14.0, 18.0, 11.0, 17.0, 28.0, 29.0, 35.0, 32.0, 29.0, 40.0, 36.0, 36.0, 31.0, 44.0, 1069.0, 43.0, 38.0, 38.0, 33.0, 40.0, 39.0, 33.0, 27.0, 33.0, 21.0, 28.0, 25.0, 30.0, 14.0, 12.0, 8.0, 9.0, 7.0, 4.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.33203125, -3.21734619140625, -3.1026611328125, -2.98797607421875, -2.873291015625, -2.75860595703125, -2.6439208984375, -2.52923583984375, -2.41455078125, -2.29986572265625, -2.1851806640625, -2.07049560546875, -1.955810546875, -1.84112548828125, -1.7264404296875, -1.61175537109375, -1.4970703125, -1.38238525390625, -1.2677001953125, -1.15301513671875, -1.038330078125, -0.92364501953125, -0.8089599609375, -0.69427490234375, -0.57958984375, -0.46490478515625, -0.3502197265625, -0.23553466796875, -0.120849609375, -0.00616455078125, 0.1085205078125, 0.22320556640625, 0.337890625, 0.45257568359375, 0.5672607421875, 0.68194580078125, 0.796630859375, 0.91131591796875, 1.0260009765625, 1.14068603515625, 1.25537109375, 1.37005615234375, 1.4847412109375, 1.59942626953125, 1.714111328125, 1.82879638671875, 1.9434814453125, 2.05816650390625, 2.1728515625, 2.28753662109375, 2.4022216796875, 2.51690673828125, 2.631591796875, 2.74627685546875, 2.8609619140625, 2.97564697265625, 3.09033203125, 3.20501708984375, 3.3197021484375, 3.43438720703125, 3.549072265625, 3.66375732421875, 3.7784423828125, 3.89312744140625, 4.0078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 19.0, 28.0, 54.0, 70.0, 140.0, 230.0, 393.0, 609.0, 1145.0, 1863.0, 3087.0, 5359.0, 8868.0, 15267.0, 25898.0, 44093.0, 73825.0, 119166.0, 168667.0, 1232717.0, 149002.0, 99702.0, 60044.0, 35688.0, 21087.0, 12398.0, 7303.0, 4260.0, 2573.0, 1419.0, 858.0, 502.0, 305.0, 182.0, 131.0, 63.0, 40.0, 27.0, 16.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5124435424804688, -0.4970550537109375, -0.48166656494140625, -0.466278076171875, -0.45088958740234375, -0.4355010986328125, -0.42011260986328125, -0.40472412109375, -0.38933563232421875, -0.3739471435546875, -0.35855865478515625, -0.343170166015625, -0.32778167724609375, -0.3123931884765625, -0.29700469970703125, -0.2816162109375, -0.26622772216796875, -0.2508392333984375, -0.23545074462890625, -0.220062255859375, -0.20467376708984375, -0.1892852783203125, -0.17389678955078125, -0.15850830078125, -0.14311981201171875, -0.1277313232421875, -0.11234283447265625, -0.096954345703125, -0.08156585693359375, -0.0661773681640625, -0.05078887939453125, -0.035400390625, -0.02001190185546875, -0.0046234130859375, 0.01076507568359375, 0.026153564453125, 0.04154205322265625, 0.0569305419921875, 0.07231903076171875, 0.08770751953125, 0.10309600830078125, 0.1184844970703125, 0.13387298583984375, 0.149261474609375, 0.16464996337890625, 0.1800384521484375, 0.19542694091796875, 0.2108154296875, 0.22620391845703125, 0.2415924072265625, 0.25698089599609375, 0.272369384765625, 0.28775787353515625, 0.3031463623046875, 0.31853485107421875, 0.33392333984375, 0.34931182861328125, 0.3647003173828125, 0.38008880615234375, 0.395477294921875, 0.41086578369140625, 0.4262542724609375, 0.44164276123046875, 0.45703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 3.0, 17.0, 18.0, 19.0, 17.0, 25.0, 27.0, 29.0, 37.0, 33.0, 55.0, 49.0, 52.0, 55.0, 50.0, 57.0, 57.0, 65.0, 50.0, 34.0, 38.0, 39.0, 28.0, 31.0, 23.0, 25.0, 9.0, 9.0, 15.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001773834228515625, -0.0017108023166656494, -0.0016477704048156738, -0.0015847384929656982, -0.0015217065811157227, -0.001458674669265747, -0.0013956427574157715, -0.001332610845565796, -0.0012695789337158203, -0.0012065470218658447, -0.0011435151100158691, -0.0010804831981658936, -0.001017451286315918, -0.0009544193744659424, -0.0008913874626159668, -0.0008283555507659912, -0.0007653236389160156, -0.00070229172706604, -0.0006392598152160645, -0.0005762279033660889, -0.0005131959915161133, -0.0004501640796661377, -0.0003871321678161621, -0.0003241002559661865, -0.00026106834411621094, -0.00019803643226623535, -0.00013500452041625977, -7.197260856628418e-05, -8.940696716308594e-06, 5.409121513366699e-05, 0.00011712312698364258, 0.00018015503883361816, 0.00024318695068359375, 0.00030621886253356934, 0.0003692507743835449, 0.0004322826862335205, 0.0004953145980834961, 0.0005583465099334717, 0.0006213784217834473, 0.0006844103336334229, 0.0007474422454833984, 0.000810474157333374, 0.0008735060691833496, 0.0009365379810333252, 0.0009995698928833008, 0.0010626018047332764, 0.001125633716583252, 0.0011886656284332275, 0.0012516975402832031, 0.0013147294521331787, 0.0013777613639831543, 0.0014407932758331299, 0.0015038251876831055, 0.001566857099533081, 0.0016298890113830566, 0.0016929209232330322, 0.0017559528350830078, 0.0018189847469329834, 0.001882016658782959, 0.0019450485706329346, 0.00200808048248291, 0.0020711123943328857, 0.0021341443061828613, 0.002197176218032837, 0.0022602081298828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 7.0, 14.0, 18.0, 19.0, 33.0, 32.0, 40.0, 50.0, 78.0, 99.0, 123.0, 204.0, 261.0, 397.0, 709.0, 2458.0, 891582.0, 149158.0, 1340.0, 603.0, 374.0, 249.0, 171.0, 125.0, 74.0, 60.0, 57.0, 49.0, 39.0, 27.0, 25.0, 14.0, 9.0, 14.0, 6.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.04388427734375, -0.042693138122558594, -0.04150199890136719, -0.04031085968017578, -0.039119720458984375, -0.03792858123779297, -0.03673744201660156, -0.035546302795410156, -0.03435516357421875, -0.033164024353027344, -0.03197288513183594, -0.03078174591064453, -0.029590606689453125, -0.02839946746826172, -0.027208328247070312, -0.026017189025878906, -0.0248260498046875, -0.023634910583496094, -0.022443771362304688, -0.02125263214111328, -0.020061492919921875, -0.01887035369873047, -0.017679214477539062, -0.016488075256347656, -0.01529693603515625, -0.014105796813964844, -0.012914657592773438, -0.011723518371582031, -0.010532379150390625, -0.009341239929199219, -0.008150100708007812, -0.006958961486816406, -0.005767822265625, -0.004576683044433594, -0.0033855438232421875, -0.0021944046020507812, -0.001003265380859375, 0.00018787384033203125, 0.0013790130615234375, 0.0025701522827148438, 0.00376129150390625, 0.004952430725097656, 0.0061435699462890625, 0.007334709167480469, 0.008525848388671875, 0.009716987609863281, 0.010908126831054688, 0.012099266052246094, 0.0132904052734375, 0.014481544494628906, 0.015672683715820312, 0.01686382293701172, 0.018054962158203125, 0.01924610137939453, 0.020437240600585938, 0.021628379821777344, 0.02281951904296875, 0.024010658264160156, 0.025201797485351562, 0.02639293670654297, 0.027584075927734375, 0.02877521514892578, 0.029966354370117188, 0.031157493591308594, 0.0323486328125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 15.0, 170.0, 627.0, 193.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007932843640446663, -0.007702961564064026, -0.007473079487681389, -0.007243197411298752, -0.007013315334916115, -0.006783433258533478, -0.0065535507164895535, -0.006323668640106916, -0.006093786563724279, -0.005863904487341642, -0.005634022410959005, -0.005404140334576368, -0.005174257792532444, -0.004944375716149807, -0.00471449363976717, -0.004484611563384533, -0.004254729487001896, -0.004024847410619259, -0.003794965334236622, -0.003565083025023341, -0.003335200948640704, -0.003105318872258067, -0.0028754365630447865, -0.0026455544866621494, -0.0024156724102795124, -0.0021857903338968754, -0.0019559082575142384, -0.0017260259483009577, -0.0014961438719183207, -0.0012662617955356836, -0.0010363796027377248, -0.0008064974099397659, -0.0005766157992184162, -0.0003467336646281183, -0.00011685153003782034, 0.0001130306045524776, 0.00034291273914277554, 0.0005727948155254126, 0.0008026770083233714, 0.0010325592011213303, 0.0012624412775039673, 0.0014923233538866043, 0.0017222055466845632, 0.001952087739482522, 0.002181969815865159, 0.002411851892247796, 0.0026417342014610767, 0.0028716162778437138, 0.003101498354226351, 0.003331380430608988, 0.003561262506991625, 0.0037911448162049055, 0.004021027125418186, 0.004250909201800823, 0.00448079127818346, 0.004710673354566097, 0.004940555430948734, 0.005170437507331371, 0.005400319583714008, 0.005630201660096645, 0.005860083736479282, 0.006089965812861919, 0.006319848354905844, 0.006549730431288481, 0.006779612507671118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 7.0, 5.0, 7.0, 8.0, 10.0, 12.0, 16.0, 19.0, 24.0, 15.0, 21.0, 33.0, 20.0, 39.0, 32.0, 30.0, 32.0, 39.0, 40.0, 39.0, 46.0, 40.0, 42.0, 42.0, 38.0, 43.0, 48.0, 31.0, 30.0, 30.0, 20.0, 27.0, 31.0, 17.0, 17.0, 10.0, 16.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0011107921600341797, -0.0010784519836306572, -0.0010461118072271347, -0.0010137716308236122, -0.0009814314544200897, -0.0009490912780165672, -0.0009167511016130447, -0.0008844109252095222, -0.0008520707488059998, -0.0008197305724024773, -0.0007873903959989548, -0.0007550502195954323, -0.0007227100431919098, -0.0006903698667883873, -0.0006580296903848648, -0.0006256895139813423, -0.0005933493375778198, -0.0005610091611742973, -0.0005286689847707748, -0.0004963288083672523, -0.00046398863196372986, -0.00043164845556020737, -0.0003993082791566849, -0.0003669681027531624, -0.0003346279263496399, -0.0003022877499461174, -0.0002699475735425949, -0.00023760739713907242, -0.00020526722073554993, -0.00017292704433202744, -0.00014058686792850494, -0.00010824669152498245, -7.590651512145996e-05, -4.356633871793747e-05, -1.1226162314414978e-05, 2.1114014089107513e-05, 5.3454190492630005e-05, 8.57943668961525e-05, 0.00011813454329967499, 0.00015047471970319748, 0.00018281489610671997, 0.00021515507251024246, 0.00024749524891376495, 0.00027983542531728745, 0.00031217560172080994, 0.00034451577812433243, 0.0003768559545278549, 0.0004091961309313774, 0.0004415363073348999, 0.0004738764837384224, 0.0005062166601419449, 0.0005385568365454674, 0.0005708970129489899, 0.0006032371893525124, 0.0006355773657560349, 0.0006679175421595573, 0.0007002577185630798, 0.0007325978949666023, 0.0007649380713701248, 0.0007972782477736473, 0.0008296184241771698, 0.0008619586005806923, 0.0008942987769842148, 0.0009266389533877373, 0.0009589791297912598]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 39.0, 36.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 27.0, 17.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 27.0, 28.0, 17.0, 55.0, 62.0, 72.0, 121.0, 121.0, 201.0, 301.0, 446.0, 648.0, 1095.0, 1856.0, 3906.0, 10705.0, 38054.0, 201413.0, 604108.0, 140026.0, 28655.0, 8510.0, 3444.0, 1691.0, 1009.0, 604.0, 385.0, 279.0, 187.0, 134.0, 98.0, 73.0, 52.0, 33.0, 31.0, 26.0, 13.0, 7.0, 12.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4296875, -9.12939453125, -8.8291015625, -8.52880859375, -8.228515625, -7.92822265625, -7.6279296875, -7.32763671875, -7.02734375, -6.72705078125, -6.4267578125, -6.12646484375, -5.826171875, -5.52587890625, -5.2255859375, -4.92529296875, -4.625, -4.32470703125, -4.0244140625, -3.72412109375, -3.423828125, -3.12353515625, -2.8232421875, -2.52294921875, -2.22265625, -1.92236328125, -1.6220703125, -1.32177734375, -1.021484375, -0.72119140625, -0.4208984375, -0.12060546875, 0.1796875, 0.47998046875, 0.7802734375, 1.08056640625, 1.380859375, 1.68115234375, 1.9814453125, 2.28173828125, 2.58203125, 2.88232421875, 3.1826171875, 3.48291015625, 3.783203125, 4.08349609375, 4.3837890625, 4.68408203125, 4.984375, 5.28466796875, 5.5849609375, 5.88525390625, 6.185546875, 6.48583984375, 6.7861328125, 7.08642578125, 7.38671875, 7.68701171875, 7.9873046875, 8.28759765625, 8.587890625, 8.88818359375, 9.1884765625, 9.48876953125, 9.7890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 20.0, 17.0, 34.0, 35.0, 40.0, 52.0, 57.0, 61.0, 101.0, 282.0, 1688.0, 176.0, 104.0, 63.0, 46.0, 43.0, 46.0, 34.0, 25.0, 11.0, 16.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.49560546875, -15.9130859375, -15.33056640625, -14.748046875, -14.16552734375, -13.5830078125, -13.00048828125, -12.41796875, -11.83544921875, -11.2529296875, -10.67041015625, -10.087890625, -9.50537109375, -8.9228515625, -8.34033203125, -7.7578125, -7.17529296875, -6.5927734375, -6.01025390625, -5.427734375, -4.84521484375, -4.2626953125, -3.68017578125, -3.09765625, -2.51513671875, -1.9326171875, -1.35009765625, -0.767578125, -0.18505859375, 0.3974609375, 0.97998046875, 1.5625, 2.14501953125, 2.7275390625, 3.31005859375, 3.892578125, 4.47509765625, 5.0576171875, 5.64013671875, 6.22265625, 6.80517578125, 7.3876953125, 7.97021484375, 8.552734375, 9.13525390625, 9.7177734375, 10.30029296875, 10.8828125, 11.46533203125, 12.0478515625, 12.63037109375, 13.212890625, 13.79541015625, 14.3779296875, 14.96044921875, 15.54296875, 16.12548828125, 16.7080078125, 17.29052734375, 17.873046875, 18.45556640625, 19.0380859375, 19.62060546875, 20.203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 18.0, 21.0, 24.0, 26.0, 50.0, 82.0, 168.0, 284.0, 630.0, 2392.0, 3122660.0, 17465.0, 959.0, 383.0, 195.0, 117.0, 59.0, 41.0, 29.0, 22.0, 20.0, 7.0, 3.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.25, -59.53466796875, -57.8193359375, -56.10400390625, -54.388671875, -52.67333984375, -50.9580078125, -49.24267578125, -47.52734375, -45.81201171875, -44.0966796875, -42.38134765625, -40.666015625, -38.95068359375, -37.2353515625, -35.52001953125, -33.8046875, -32.08935546875, -30.3740234375, -28.65869140625, -26.943359375, -25.22802734375, -23.5126953125, -21.79736328125, -20.08203125, -18.36669921875, -16.6513671875, -14.93603515625, -13.220703125, -11.50537109375, -9.7900390625, -8.07470703125, -6.359375, -4.64404296875, -2.9287109375, -1.21337890625, 0.501953125, 2.21728515625, 3.9326171875, 5.64794921875, 7.36328125, 9.07861328125, 10.7939453125, 12.50927734375, 14.224609375, 15.93994140625, 17.6552734375, 19.37060546875, 21.0859375, 22.80126953125, 24.5166015625, 26.23193359375, 27.947265625, 29.66259765625, 31.3779296875, 33.09326171875, 34.80859375, 36.52392578125, 38.2392578125, 39.95458984375, 41.669921875, 43.38525390625, 45.1005859375, 46.81591796875, 48.53125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 204.0, 726.0, 76.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.03435516357422, -60.329872131347656, -56.625389099121094, -52.9209098815918, -49.216426849365234, -45.51194381713867, -41.807464599609375, -38.10298156738281, -34.39849853515625, -30.694015502929688, -26.989534378051758, -23.285053253173828, -19.580570220947266, -15.876087188720703, -12.171606063842773, -8.467124938964844, -4.762641906738281, -1.0581598281860352, 2.646322250366211, 6.350804328918457, 10.055286407470703, 13.759769439697266, 17.464250564575195, 21.168731689453125, 24.873214721679688, 28.57769775390625, 32.28218078613281, 35.98666000366211, 39.69114303588867, 43.395626068115234, 47.10010528564453, 50.804588317871094, 54.509063720703125, 58.21354675292969, 61.91802978515625, 65.62251281738281, 69.32699584960938, 73.03147888183594, 76.73595428466797, 80.44043731689453, 84.1449203491211, 87.84940338134766, 91.55388641357422, 95.25836944580078, 98.96284484863281, 102.66732788085938, 106.37181091308594, 110.0762939453125, 113.78077697753906, 117.48526000976562, 121.18974304199219, 124.89422607421875, 128.5987091064453, 132.30319213867188, 136.00767517089844, 139.712158203125, 143.4166259765625, 147.12110900878906, 150.82559204101562, 154.5300750732422, 158.23455810546875, 161.9390411376953, 165.64352416992188, 169.34799194335938, 173.052490234375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 13.0, 18.0, 23.0, 18.0, 22.0, 24.0, 22.0, 28.0, 38.0, 35.0, 46.0, 32.0, 37.0, 42.0, 44.0, 50.0, 43.0, 34.0, 39.0, 35.0, 36.0, 30.0, 36.0, 29.0, 30.0, 30.0, 21.0, 14.0, 15.0, 13.0, 13.0, 11.0, 7.0, 10.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-34.330711364746094, -33.250938415527344, -32.17116928100586, -31.09139633178711, -30.01162338256836, -28.931852340698242, -27.852081298828125, -26.772308349609375, -25.692535400390625, -24.612764358520508, -23.532991409301758, -22.45322036743164, -21.37344741821289, -20.293676376342773, -19.213905334472656, -18.134132385253906, -17.05436134338379, -15.974589347839355, -14.894817352294922, -13.815046310424805, -12.735273361206055, -11.655502319335938, -10.575730323791504, -9.49595832824707, -8.416186332702637, -7.336414337158203, -6.2566423416137695, -5.176870822906494, -4.0970988273620605, -3.017326831817627, -1.9375553131103516, -0.857783317565918, 0.22198867797851562, 1.3017605543136597, 2.3815324306488037, 3.461304187774658, 4.541076183319092, 5.620848178863525, 6.700619697570801, 7.780391693115234, 8.860163688659668, 9.939935684204102, 11.019707679748535, 12.099479675292969, 13.179250717163086, 14.259023666381836, 15.338794708251953, 16.418567657470703, 17.49833869934082, 18.578109741210938, 19.657882690429688, 20.737653732299805, 21.817426681518555, 22.897197723388672, 23.976970672607422, 25.05674171447754, 26.136512756347656, 27.216283798217773, 28.296056747436523, 29.37582778930664, 30.45560073852539, 31.535371780395508, 32.615142822265625, 33.694915771484375, 34.774688720703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 8.0, 16.0, 17.0, 18.0, 24.0, 22.0, 23.0, 18.0, 31.0, 41.0, 36.0, 36.0, 44.0, 37.0, 44.0, 46.0, 48.0, 34.0, 29.0, 57.0, 26.0, 36.0, 43.0, 28.0, 25.0, 23.0, 21.0, 30.0, 14.0, 21.0, 11.0, 18.0, 7.0, 4.0, 5.0, 4.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.1334228515625, -6.923095703125, -6.7127685546875, -6.50244140625, -6.2921142578125, -6.081787109375, -5.8714599609375, -5.6611328125, -5.4508056640625, -5.240478515625, -5.0301513671875, -4.81982421875, -4.6094970703125, -4.399169921875, -4.1888427734375, -3.978515625, -3.7681884765625, -3.557861328125, -3.3475341796875, -3.13720703125, -2.9268798828125, -2.716552734375, -2.5062255859375, -2.2958984375, -2.0855712890625, -1.875244140625, -1.6649169921875, -1.45458984375, -1.2442626953125, -1.033935546875, -0.8236083984375, -0.61328125, -0.4029541015625, -0.192626953125, 0.0177001953125, 0.22802734375, 0.4383544921875, 0.648681640625, 0.8590087890625, 1.0693359375, 1.2796630859375, 1.489990234375, 1.7003173828125, 1.91064453125, 2.1209716796875, 2.331298828125, 2.5416259765625, 2.751953125, 2.9622802734375, 3.172607421875, 3.3829345703125, 3.59326171875, 3.8035888671875, 4.013916015625, 4.2242431640625, 4.4345703125, 4.6448974609375, 4.855224609375, 5.0655517578125, 5.27587890625, 5.4862060546875, 5.696533203125, 5.9068603515625, 6.1171875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 14.0, 11.0, 16.0, 22.0, 26.0, 41.0, 35.0, 44.0, 59.0, 60.0, 77.0, 116.0, 156.0, 202.0, 224.0, 360.0, 490.0, 883.0, 1818.0, 6791.0, 81212.0, 3554881.0, 526849.0, 13834.0, 2762.0, 1058.0, 584.0, 403.0, 253.0, 202.0, 164.0, 126.0, 102.0, 79.0, 62.0, 58.0, 41.0, 34.0, 24.0, 14.0, 17.0, 15.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.0625, -32.01904296875, -30.9755859375, -29.93212890625, -28.888671875, -27.84521484375, -26.8017578125, -25.75830078125, -24.71484375, -23.67138671875, -22.6279296875, -21.58447265625, -20.541015625, -19.49755859375, -18.4541015625, -17.41064453125, -16.3671875, -15.32373046875, -14.2802734375, -13.23681640625, -12.193359375, -11.14990234375, -10.1064453125, -9.06298828125, -8.01953125, -6.97607421875, -5.9326171875, -4.88916015625, -3.845703125, -2.80224609375, -1.7587890625, -0.71533203125, 0.328125, 1.37158203125, 2.4150390625, 3.45849609375, 4.501953125, 5.54541015625, 6.5888671875, 7.63232421875, 8.67578125, 9.71923828125, 10.7626953125, 11.80615234375, 12.849609375, 13.89306640625, 14.9365234375, 15.97998046875, 17.0234375, 18.06689453125, 19.1103515625, 20.15380859375, 21.197265625, 22.24072265625, 23.2841796875, 24.32763671875, 25.37109375, 26.41455078125, 27.4580078125, 28.50146484375, 29.544921875, 30.58837890625, 31.6318359375, 32.67529296875, 33.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 17.0, 25.0, 86.0, 178.0, 488.0, 972.0, 1256.0, 597.0, 245.0, 104.0, 46.0, 16.0, 15.0, 5.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.78125, -36.9447021484375, -36.108154296875, -35.2716064453125, -34.43505859375, -33.5985107421875, -32.761962890625, -31.9254150390625, -31.0888671875, -30.2523193359375, -29.415771484375, -28.5792236328125, -27.74267578125, -26.9061279296875, -26.069580078125, -25.2330322265625, -24.396484375, -23.5599365234375, -22.723388671875, -21.8868408203125, -21.05029296875, -20.2137451171875, -19.377197265625, -18.5406494140625, -17.7041015625, -16.8675537109375, -16.031005859375, -15.1944580078125, -14.35791015625, -13.5213623046875, -12.684814453125, -11.8482666015625, -11.01171875, -10.1751708984375, -9.338623046875, -8.5020751953125, -7.66552734375, -6.8289794921875, -5.992431640625, -5.1558837890625, -4.3193359375, -3.4827880859375, -2.646240234375, -1.8096923828125, -0.97314453125, -0.1365966796875, 0.699951171875, 1.5364990234375, 2.373046875, 3.2095947265625, 4.046142578125, 4.8826904296875, 5.71923828125, 6.5557861328125, 7.392333984375, 8.2288818359375, 9.0654296875, 9.9019775390625, 10.738525390625, 11.5750732421875, 12.41162109375, 13.2481689453125, 14.084716796875, 14.9212646484375, 15.7578125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 8.0, 15.0, 31.0, 43.0, 45.0, 89.0, 178.0, 535.0, 2273.0, 29930.0, 3812218.0, 340758.0, 6612.0, 933.0, 324.0, 117.0, 71.0, 37.0, 27.0, 16.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.0625, -40.9482421875, -39.833984375, -38.7197265625, -37.60546875, -36.4912109375, -35.376953125, -34.2626953125, -33.1484375, -32.0341796875, -30.919921875, -29.8056640625, -28.69140625, -27.5771484375, -26.462890625, -25.3486328125, -24.234375, -23.1201171875, -22.005859375, -20.8916015625, -19.77734375, -18.6630859375, -17.548828125, -16.4345703125, -15.3203125, -14.2060546875, -13.091796875, -11.9775390625, -10.86328125, -9.7490234375, -8.634765625, -7.5205078125, -6.40625, -5.2919921875, -4.177734375, -3.0634765625, -1.94921875, -0.8349609375, 0.279296875, 1.3935546875, 2.5078125, 3.6220703125, 4.736328125, 5.8505859375, 6.96484375, 8.0791015625, 9.193359375, 10.3076171875, 11.421875, 12.5361328125, 13.650390625, 14.7646484375, 15.87890625, 16.9931640625, 18.107421875, 19.2216796875, 20.3359375, 21.4501953125, 22.564453125, 23.6787109375, 24.79296875, 25.9072265625, 27.021484375, 28.1357421875, 29.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 19.0, 26.0, 27.0, 70.0, 103.0, 123.0, 128.0, 137.0, 111.0, 83.0, 68.0, 34.0, 21.0, 21.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.160179138183594, -37.987518310546875, -34.814857482910156, -31.642200469970703, -28.469539642333984, -25.296878814697266, -22.12421989440918, -18.951560974121094, -15.778900146484375, -12.606240272521973, -9.43358039855957, -6.260920524597168, -3.0882606506347656, 0.08439922332763672, 3.257059097290039, 6.429718017578125, 9.602378845214844, 12.775038719177246, 15.947698593139648, 19.120357513427734, 22.293018341064453, 25.465679168701172, 28.638338088989258, 31.810997009277344, 34.98365783691406, 38.15631866455078, 41.3289794921875, 44.50163650512695, 47.67429733276367, 50.84695816040039, 54.019615173339844, 57.19227600097656, 60.36494445800781, 63.53760528564453, 66.71026611328125, 69.88292694091797, 73.05558776855469, 76.22824096679688, 79.4009017944336, 82.57356262207031, 85.74622344970703, 88.91888427734375, 92.09154510498047, 95.26420593261719, 98.43685913085938, 101.6095199584961, 104.78218078613281, 107.95484161376953, 111.12750244140625, 114.30016326904297, 117.47282409667969, 120.6454849243164, 123.81814575195312, 126.99079895019531, 130.16346740722656, 133.33612060546875, 136.5087890625, 139.6814422607422, 142.85411071777344, 146.02676391601562, 149.19943237304688, 152.37208557128906, 155.5447540283203, 158.7174072265625, 161.8900604248047]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 5.0, 4.0, 9.0, 16.0, 20.0, 13.0, 24.0, 18.0, 24.0, 24.0, 34.0, 27.0, 30.0, 31.0, 29.0, 39.0, 34.0, 36.0, 44.0, 44.0, 39.0, 42.0, 35.0, 37.0, 31.0, 28.0, 38.0, 16.0, 31.0, 30.0, 24.0, 18.0, 13.0, 17.0, 13.0, 11.0, 16.0, 6.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.422119140625, -39.09198760986328, -37.76185989379883, -36.43172836303711, -35.101600646972656, -33.77146911621094, -32.44133758544922, -31.111207962036133, -29.781078338623047, -28.45094871520996, -27.120819091796875, -25.790687561035156, -24.46055793762207, -23.130428314208984, -21.800296783447266, -20.47016716003418, -19.140037536621094, -17.809907913208008, -16.479778289794922, -15.149646759033203, -13.819517135620117, -12.489387512207031, -11.159256935119629, -9.829126358032227, -8.49899673461914, -7.1688666343688965, -5.838736534118652, -4.508606433868408, -3.178476333618164, -1.84834623336792, -0.5182161331176758, 0.8119144439697266, 2.1420440673828125, 3.4721741676330566, 4.802304267883301, 6.132434368133545, 7.462564468383789, 8.792694091796875, 10.122824668884277, 11.45295524597168, 12.783084869384766, 14.113214492797852, 15.443345069885254, 16.773475646972656, 18.103605270385742, 19.433734893798828, 20.763866424560547, 22.093996047973633, 23.42412567138672, 24.754255294799805, 26.08438491821289, 27.41451644897461, 28.744646072387695, 30.07477569580078, 31.4049072265625, 32.73503875732422, 34.06516647338867, 35.39529800415039, 36.725425720214844, 38.05555725097656, 39.38568878173828, 40.715816497802734, 42.04594802856445, 43.376075744628906, 44.706207275390625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 7.0, 5.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 19.0, 27.0, 36.0, 33.0, 29.0, 28.0, 42.0, 42.0, 39.0, 29.0, 42.0, 44.0, 50.0, 42.0, 40.0, 27.0, 36.0, 29.0, 27.0, 30.0, 28.0, 24.0, 26.0, 17.0, 9.0, 16.0, 19.0, 12.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-75.125, -72.7626953125, -70.400390625, -68.0380859375, -65.67578125, -63.3134765625, -60.951171875, -58.5888671875, -56.2265625, -53.8642578125, -51.501953125, -49.1396484375, -46.77734375, -44.4150390625, -42.052734375, -39.6904296875, -37.328125, -34.9658203125, -32.603515625, -30.2412109375, -27.87890625, -25.5166015625, -23.154296875, -20.7919921875, -18.4296875, -16.0673828125, -13.705078125, -11.3427734375, -8.98046875, -6.6181640625, -4.255859375, -1.8935546875, 0.46875, 2.8310546875, 5.193359375, 7.5556640625, 9.91796875, 12.2802734375, 14.642578125, 17.0048828125, 19.3671875, 21.7294921875, 24.091796875, 26.4541015625, 28.81640625, 31.1787109375, 33.541015625, 35.9033203125, 38.265625, 40.6279296875, 42.990234375, 45.3525390625, 47.71484375, 50.0771484375, 52.439453125, 54.8017578125, 57.1640625, 59.5263671875, 61.888671875, 64.2509765625, 66.61328125, 68.9755859375, 71.337890625, 73.7001953125, 76.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 13.0, 14.0, 28.0, 37.0, 66.0, 104.0, 159.0, 246.0, 406.0, 572.0, 929.0, 1429.0, 2098.0, 3379.0, 5069.0, 7840.0, 12261.0, 18763.0, 29532.0, 46597.0, 72496.0, 108444.0, 148386.0, 167116.0, 140643.0, 99082.0, 65315.0, 42101.0, 26727.0, 17218.0, 11175.0, 7108.0, 4573.0, 3042.0, 1982.0, 1272.0, 808.0, 547.0, 368.0, 223.0, 152.0, 90.0, 53.0, 36.0, 26.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.0625, -5.88092041015625, -5.6993408203125, -5.51776123046875, -5.336181640625, -5.15460205078125, -4.9730224609375, -4.79144287109375, -4.60986328125, -4.42828369140625, -4.2467041015625, -4.06512451171875, -3.883544921875, -3.70196533203125, -3.5203857421875, -3.33880615234375, -3.1572265625, -2.97564697265625, -2.7940673828125, -2.61248779296875, -2.430908203125, -2.24932861328125, -2.0677490234375, -1.88616943359375, -1.70458984375, -1.52301025390625, -1.3414306640625, -1.15985107421875, -0.978271484375, -0.79669189453125, -0.6151123046875, -0.43353271484375, -0.251953125, -0.07037353515625, 0.1112060546875, 0.29278564453125, 0.474365234375, 0.65594482421875, 0.8375244140625, 1.01910400390625, 1.20068359375, 1.38226318359375, 1.5638427734375, 1.74542236328125, 1.927001953125, 2.10858154296875, 2.2901611328125, 2.47174072265625, 2.6533203125, 2.83489990234375, 3.0164794921875, 3.19805908203125, 3.379638671875, 3.56121826171875, 3.7427978515625, 3.92437744140625, 4.10595703125, 4.28753662109375, 4.4691162109375, 4.65069580078125, 4.832275390625, 5.01385498046875, 5.1954345703125, 5.37701416015625, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 11.0, 9.0, 8.0, 15.0, 27.0, 24.0, 25.0, 25.0, 24.0, 29.0, 26.0, 36.0, 41.0, 55.0, 30.0, 42.0, 49.0, 1066.0, 43.0, 39.0, 35.0, 30.0, 22.0, 46.0, 38.0, 33.0, 24.0, 26.0, 18.0, 11.0, 20.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.875, -51.2802734375, -49.685546875, -48.0908203125, -46.49609375, -44.9013671875, -43.306640625, -41.7119140625, -40.1171875, -38.5224609375, -36.927734375, -35.3330078125, -33.73828125, -32.1435546875, -30.548828125, -28.9541015625, -27.359375, -25.7646484375, -24.169921875, -22.5751953125, -20.98046875, -19.3857421875, -17.791015625, -16.1962890625, -14.6015625, -13.0068359375, -11.412109375, -9.8173828125, -8.22265625, -6.6279296875, -5.033203125, -3.4384765625, -1.84375, -0.2490234375, 1.345703125, 2.9404296875, 4.53515625, 6.1298828125, 7.724609375, 9.3193359375, 10.9140625, 12.5087890625, 14.103515625, 15.6982421875, 17.29296875, 18.8876953125, 20.482421875, 22.0771484375, 23.671875, 25.2666015625, 26.861328125, 28.4560546875, 30.05078125, 31.6455078125, 33.240234375, 34.8349609375, 36.4296875, 38.0244140625, 39.619140625, 41.2138671875, 42.80859375, 44.4033203125, 45.998046875, 47.5927734375, 49.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 7.0, 17.0, 28.0, 35.0, 57.0, 74.0, 119.0, 196.0, 314.0, 503.0, 693.0, 1133.0, 1799.0, 2854.0, 4552.0, 7190.0, 11324.0, 17975.0, 28865.0, 46365.0, 73301.0, 112166.0, 153878.0, 1216529.0, 142627.0, 100577.0, 64647.0, 40615.0, 25373.0, 15975.0, 9990.0, 6432.0, 4018.0, 2628.0, 1563.0, 955.0, 615.0, 380.0, 271.0, 150.0, 114.0, 83.0, 53.0, 34.0, 16.0, 15.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.640625, -5.46075439453125, -5.2808837890625, -5.10101318359375, -4.921142578125, -4.74127197265625, -4.5614013671875, -4.38153076171875, -4.20166015625, -4.02178955078125, -3.8419189453125, -3.66204833984375, -3.482177734375, -3.30230712890625, -3.1224365234375, -2.94256591796875, -2.7626953125, -2.58282470703125, -2.4029541015625, -2.22308349609375, -2.043212890625, -1.86334228515625, -1.6834716796875, -1.50360107421875, -1.32373046875, -1.14385986328125, -0.9639892578125, -0.78411865234375, -0.604248046875, -0.42437744140625, -0.2445068359375, -0.06463623046875, 0.115234375, 0.29510498046875, 0.4749755859375, 0.65484619140625, 0.834716796875, 1.01458740234375, 1.1944580078125, 1.37432861328125, 1.55419921875, 1.73406982421875, 1.9139404296875, 2.09381103515625, 2.273681640625, 2.45355224609375, 2.6334228515625, 2.81329345703125, 2.9931640625, 3.17303466796875, 3.3529052734375, 3.53277587890625, 3.712646484375, 3.89251708984375, 4.0723876953125, 4.25225830078125, 4.43212890625, 4.61199951171875, 4.7918701171875, 4.97174072265625, 5.151611328125, 5.33148193359375, 5.5113525390625, 5.69122314453125, 5.87109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 6.0, 6.0, 6.0, 9.0, 10.0, 10.0, 20.0, 13.0, 22.0, 47.0, 23.0, 37.0, 44.0, 47.0, 70.0, 69.0, 70.0, 74.0, 62.0, 54.0, 52.0, 44.0, 28.0, 28.0, 27.0, 26.0, 14.0, 11.0, 9.0, 13.0, 8.0, 1.0, 5.0, 0.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04443359375, -0.042922019958496094, -0.04141044616699219, -0.03989887237548828, -0.038387298583984375, -0.03687572479248047, -0.03536415100097656, -0.033852577209472656, -0.03234100341796875, -0.030829429626464844, -0.029317855834960938, -0.02780628204345703, -0.026294708251953125, -0.02478313446044922, -0.023271560668945312, -0.021759986877441406, -0.0202484130859375, -0.018736839294433594, -0.017225265502929688, -0.01571369171142578, -0.014202117919921875, -0.012690544128417969, -0.011178970336914062, -0.009667396545410156, -0.00815582275390625, -0.006644248962402344, -0.0051326751708984375, -0.0036211013793945312, -0.002109527587890625, -0.0005979537963867188, 0.0009136199951171875, 0.0024251937866210938, 0.003936767578125, 0.005448341369628906, 0.0069599151611328125, 0.008471488952636719, 0.009983062744140625, 0.011494636535644531, 0.013006210327148438, 0.014517784118652344, 0.01602935791015625, 0.017540931701660156, 0.019052505493164062, 0.02056407928466797, 0.022075653076171875, 0.02358722686767578, 0.025098800659179688, 0.026610374450683594, 0.0281219482421875, 0.029633522033691406, 0.031145095825195312, 0.03265666961669922, 0.034168243408203125, 0.03567981719970703, 0.03719139099121094, 0.038702964782714844, 0.04021453857421875, 0.041726112365722656, 0.04323768615722656, 0.04474925994873047, 0.046260833740234375, 0.04777240753173828, 0.04928398132324219, 0.050795555114746094, 0.05230712890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 11.0, 9.0, 11.0, 18.0, 17.0, 21.0, 31.0, 50.0, 55.0, 70.0, 96.0, 133.0, 171.0, 204.0, 337.0, 590.0, 978.0, 1908.0, 4782.0, 14837.0, 56362.0, 258210.0, 515524.0, 144019.0, 33524.0, 9401.0, 3306.0, 1484.0, 791.0, 458.0, 312.0, 179.0, 145.0, 131.0, 86.0, 68.0, 54.0, 34.0, 36.0, 22.0, 10.0, 16.0, 11.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.31689453125, -0.3076591491699219, -0.29842376708984375, -0.2891883850097656, -0.2799530029296875, -0.2707176208496094, -0.26148223876953125, -0.2522468566894531, -0.243011474609375, -0.23377609252929688, -0.22454071044921875, -0.21530532836914062, -0.2060699462890625, -0.19683456420898438, -0.18759918212890625, -0.17836380004882812, -0.16912841796875, -0.15989303588867188, -0.15065765380859375, -0.14142227172851562, -0.1321868896484375, -0.12295150756835938, -0.11371612548828125, -0.10448074340820312, -0.095245361328125, -0.08600997924804688, -0.07677459716796875, -0.06753921508789062, -0.0583038330078125, -0.049068450927734375, -0.03983306884765625, -0.030597686767578125, -0.0213623046875, -0.012126922607421875, -0.00289154052734375, 0.006343841552734375, 0.0155792236328125, 0.024814605712890625, 0.03404998779296875, 0.043285369873046875, 0.052520751953125, 0.061756134033203125, 0.07099151611328125, 0.08022689819335938, 0.0894622802734375, 0.09869766235351562, 0.10793304443359375, 0.11716842651367188, 0.12640380859375, 0.13563919067382812, 0.14487457275390625, 0.15410995483398438, 0.1633453369140625, 0.17258071899414062, 0.18181610107421875, 0.19105148315429688, 0.200286865234375, 0.20952224731445312, 0.21875762939453125, 0.22799301147460938, 0.2372283935546875, 0.24646377563476562, 0.25569915771484375, 0.2649345397949219, 0.274169921875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 37.0, 55.0, 102.0, 175.0, 196.0, 144.0, 99.0, 70.0, 39.0, 24.0, 12.0, 14.0, 6.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04953237250447273, -0.04664928838610649, -0.04376620054244995, -0.04088311642408371, -0.03800003230571747, -0.03511694818735123, -0.03223386034369469, -0.029350776225328445, -0.026467690244317055, -0.023584604263305664, -0.020701520144939423, -0.017818434163928032, -0.014935349114239216, -0.0120522640645504, -0.009169178083539009, -0.006286093965172768, -0.003403007984161377, -0.0005199227016419172, 0.0023631625808775425, 0.005246248096227646, 0.008129333145916462, 0.011012418195605278, 0.013895504176616669, 0.01677858829498291, 0.0196616742759943, 0.02254476025700569, 0.025427844375371933, 0.028310930356383324, 0.031194016337394714, 0.034077100455760956, 0.0369601845741272, 0.03984326869249344, 0.04272636026144028, 0.04560944437980652, 0.04849253222346306, 0.0513756163418293, 0.05425870046019554, 0.05714178830385208, 0.06002487242221832, 0.06290795654058456, 0.0657910406589508, 0.06867412477731705, 0.07155720889568329, 0.07444030046463013, 0.07732338458299637, 0.08020646870136261, 0.08308955281972885, 0.08597263693809509, 0.08885572850704193, 0.09173881262540817, 0.09462189674377441, 0.09750498831272125, 0.1003880724310875, 0.10327115654945374, 0.10615424066781998, 0.10903732478618622, 0.11192040890455246, 0.1148034930229187, 0.11768657714128494, 0.12056966125965118, 0.12345275282859802, 0.12633582949638367, 0.1292189210653305, 0.13210201263427734, 0.134985089302063]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 10.0, 4.0, 5.0, 10.0, 7.0, 8.0, 12.0, 12.0, 18.0, 23.0, 11.0, 10.0, 27.0, 23.0, 28.0, 38.0, 37.0, 31.0, 40.0, 32.0, 29.0, 51.0, 34.0, 37.0, 44.0, 25.0, 43.0, 47.0, 28.0, 39.0, 30.0, 23.0, 26.0, 22.0, 24.0, 21.0, 17.0, 20.0, 9.0, 12.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03220796585083008, -0.03122302144765854, -0.03023807890713215, -0.02925313636660576, -0.02826819196343422, -0.02728324756026268, -0.02629830501973629, -0.0253133624792099, -0.02432841807603836, -0.02334347367286682, -0.02235853113234043, -0.02137358859181404, -0.020388644188642502, -0.019403699785470963, -0.018418757244944572, -0.017433814704418182, -0.016448870301246643, -0.015463926829397678, -0.014478983357548714, -0.013494039885699749, -0.012509096413850784, -0.01152415294200182, -0.010539209470152855, -0.00955426599830389, -0.008569322526454926, -0.007584379054605961, -0.006599435582756996, -0.0056144921109080315, -0.004629548639059067, -0.003644605167210102, -0.0026596616953611374, -0.0016747182235121727, -0.000689774751663208, 0.0002951687201857567, 0.0012801121920347214, 0.002265055663883686, 0.0032499991357326508, 0.0042349426075816154, 0.00521988607943058, 0.006204829551279545, 0.0071897730231285095, 0.008174716494977474, 0.009159659966826439, 0.010144603438675404, 0.011129546910524368, 0.012114490382373333, 0.013099433854222298, 0.014084377326071262, 0.015069320797920227, 0.016054265201091766, 0.017039207741618156, 0.018024150282144547, 0.019009094685316086, 0.019994039088487625, 0.020978981629014015, 0.021963924169540405, 0.022948868572711945, 0.023933812975883484, 0.024918755516409874, 0.025903698056936264, 0.026888642460107803, 0.027873586863279343, 0.028858529403805733, 0.029843471944332123, 0.030828416347503662]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 6.0, 6.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 20.0, 27.0, 37.0, 30.0, 29.0, 29.0, 41.0, 43.0, 39.0, 30.0, 43.0, 42.0, 49.0, 42.0, 41.0, 26.0, 37.0, 28.0, 29.0, 31.0, 26.0, 24.0, 23.0, 19.0, 10.0, 16.0, 20.0, 11.0, 9.0, 9.0, 10.0, 4.0, 5.0, 3.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-75.0625, -72.7021484375, -70.341796875, -67.9814453125, -65.62109375, -63.2607421875, -60.900390625, -58.5400390625, -56.1796875, -53.8193359375, -51.458984375, -49.0986328125, -46.73828125, -44.3779296875, -42.017578125, -39.6572265625, -37.296875, -34.9365234375, -32.576171875, -30.2158203125, -27.85546875, -25.4951171875, -23.134765625, -20.7744140625, -18.4140625, -16.0537109375, -13.693359375, -11.3330078125, -8.97265625, -6.6123046875, -4.251953125, -1.8916015625, 0.46875, 2.8291015625, 5.189453125, 7.5498046875, 9.91015625, 12.2705078125, 14.630859375, 16.9912109375, 19.3515625, 21.7119140625, 24.072265625, 26.4326171875, 28.79296875, 31.1533203125, 33.513671875, 35.8740234375, 38.234375, 40.5947265625, 42.955078125, 45.3154296875, 47.67578125, 50.0361328125, 52.396484375, 54.7568359375, 57.1171875, 59.4775390625, 61.837890625, 64.1982421875, 66.55859375, 68.9189453125, 71.279296875, 73.6396484375, 76.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 5.0, 11.0, 17.0, 19.0, 24.0, 39.0, 45.0, 77.0, 88.0, 177.0, 253.0, 373.0, 689.0, 1233.0, 2272.0, 4740.0, 11699.0, 37529.0, 180240.0, 593883.0, 160095.0, 34364.0, 11073.0, 4484.0, 2155.0, 1191.0, 621.0, 400.0, 214.0, 161.0, 102.0, 83.0, 52.0, 27.0, 21.0, 26.0, 13.0, 17.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.517578125, -15.95703125, -15.396484375, -14.8359375, -14.275390625, -13.71484375, -13.154296875, -12.59375, -12.033203125, -11.47265625, -10.912109375, -10.3515625, -9.791015625, -9.23046875, -8.669921875, -8.109375, -7.548828125, -6.98828125, -6.427734375, -5.8671875, -5.306640625, -4.74609375, -4.185546875, -3.625, -3.064453125, -2.50390625, -1.943359375, -1.3828125, -0.822265625, -0.26171875, 0.298828125, 0.859375, 1.419921875, 1.98046875, 2.541015625, 3.1015625, 3.662109375, 4.22265625, 4.783203125, 5.34375, 5.904296875, 6.46484375, 7.025390625, 7.5859375, 8.146484375, 8.70703125, 9.267578125, 9.828125, 10.388671875, 10.94921875, 11.509765625, 12.0703125, 12.630859375, 13.19140625, 13.751953125, 14.3125, 14.873046875, 15.43359375, 15.994140625, 16.5546875, 17.115234375, 17.67578125, 18.236328125, 18.796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 11.0, 28.0, 29.0, 28.0, 36.0, 48.0, 56.0, 58.0, 72.0, 87.0, 2128.0, 75.0, 79.0, 54.0, 41.0, 39.0, 26.0, 25.0, 19.0, 15.0, 12.0, 7.0, 9.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.5, -168.85546875, -162.2109375, -155.56640625, -148.921875, -142.27734375, -135.6328125, -128.98828125, -122.34375, -115.69921875, -109.0546875, -102.41015625, -95.765625, -89.12109375, -82.4765625, -75.83203125, -69.1875, -62.54296875, -55.8984375, -49.25390625, -42.609375, -35.96484375, -29.3203125, -22.67578125, -16.03125, -9.38671875, -2.7421875, 3.90234375, 10.546875, 17.19140625, 23.8359375, 30.48046875, 37.125, 43.76953125, 50.4140625, 57.05859375, 63.703125, 70.34765625, 76.9921875, 83.63671875, 90.28125, 96.92578125, 103.5703125, 110.21484375, 116.859375, 123.50390625, 130.1484375, 136.79296875, 143.4375, 150.08203125, 156.7265625, 163.37109375, 170.015625, 176.66015625, 183.3046875, 189.94921875, 196.59375, 203.23828125, 209.8828125, 216.52734375, 223.171875, 229.81640625, 236.4609375, 243.10546875, 249.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 8.0, 8.0, 13.0, 17.0, 11.0, 28.0, 36.0, 52.0, 81.0, 98.0, 194.0, 242.0, 409.0, 872.0, 2214.0, 9776.0, 165203.0, 2922826.0, 36072.0, 4461.0, 1384.0, 683.0, 351.0, 192.0, 143.0, 89.0, 70.0, 41.0, 27.0, 27.0, 22.0, 8.0, 10.0, 4.0, 7.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-50.84375, -49.44189453125, -48.0400390625, -46.63818359375, -45.236328125, -43.83447265625, -42.4326171875, -41.03076171875, -39.62890625, -38.22705078125, -36.8251953125, -35.42333984375, -34.021484375, -32.61962890625, -31.2177734375, -29.81591796875, -28.4140625, -27.01220703125, -25.6103515625, -24.20849609375, -22.806640625, -21.40478515625, -20.0029296875, -18.60107421875, -17.19921875, -15.79736328125, -14.3955078125, -12.99365234375, -11.591796875, -10.18994140625, -8.7880859375, -7.38623046875, -5.984375, -4.58251953125, -3.1806640625, -1.77880859375, -0.376953125, 1.02490234375, 2.4267578125, 3.82861328125, 5.23046875, 6.63232421875, 8.0341796875, 9.43603515625, 10.837890625, 12.23974609375, 13.6416015625, 15.04345703125, 16.4453125, 17.84716796875, 19.2490234375, 20.65087890625, 22.052734375, 23.45458984375, 24.8564453125, 26.25830078125, 27.66015625, 29.06201171875, 30.4638671875, 31.86572265625, 33.267578125, 34.66943359375, 36.0712890625, 37.47314453125, 38.875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 16.0, 31.0, 142.0, 460.0, 242.0, 76.0, 22.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-918.1880493164062, -899.7416381835938, -881.2952270507812, -862.8488159179688, -844.4024658203125, -825.9560546875, -807.5096435546875, -789.063232421875, -770.6168212890625, -752.17041015625, -733.7239990234375, -715.277587890625, -696.8311767578125, -678.3848266601562, -659.9384155273438, -641.4920043945312, -623.0455932617188, -604.5991821289062, -586.1527709960938, -567.7063598632812, -549.260009765625, -530.8135986328125, -512.3671875, -493.9207763671875, -475.474365234375, -457.0279541015625, -438.58154296875, -420.1351623535156, -401.6887512207031, -383.2423400878906, -364.79595947265625, -346.34954833984375, -327.9031677246094, -309.4567565917969, -291.0103759765625, -272.56396484375, -254.1175537109375, -235.671142578125, -217.22474670410156, -198.77835083007812, -180.33193969726562, -161.88552856445312, -143.4391326904297, -124.99272918701172, -106.54632568359375, -88.09992218017578, -69.65351867675781, -51.207122802734375, -32.760711669921875, -14.314308166503906, 4.1320953369140625, 22.57849884033203, 41.02490234375, 59.47130584716797, 77.91770935058594, 96.36410522460938, 114.81051635742188, 133.25692749023438, 151.7033233642578, 170.14971923828125, 188.59613037109375, 207.04254150390625, 225.4889373779297, 243.93533325195312, 262.3817443847656]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 15.0, 8.0, 25.0, 15.0, 22.0, 33.0, 29.0, 30.0, 34.0, 38.0, 49.0, 40.0, 51.0, 61.0, 55.0, 46.0, 62.0, 57.0, 44.0, 37.0, 44.0, 33.0, 24.0, 23.0, 18.0, 14.0, 16.0, 8.0, 13.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-227.23028564453125, -220.158935546875, -213.08758544921875, -206.01622009277344, -198.9448699951172, -191.87351989746094, -184.80215454101562, -177.73080444335938, -170.65945434570312, -163.58810424804688, -156.51675415039062, -149.4453887939453, -142.37403869628906, -135.3026885986328, -128.2313232421875, -121.15997314453125, -114.088623046875, -107.01727294921875, -99.94591522216797, -92.87455749511719, -85.80320739746094, -78.73185729980469, -71.6604995727539, -64.58914184570312, -57.517791748046875, -50.44643783569336, -43.375083923339844, -36.30373001098633, -29.232376098632812, -22.161022186279297, -15.089668273925781, -8.018314361572266, -0.94696044921875, 6.124393463134766, 13.195747375488281, 20.267101287841797, 27.338455200195312, 34.40980911254883, 41.481163024902344, 48.55251693725586, 55.623870849609375, 62.69522476196289, 69.7665786743164, 76.83793640136719, 83.90928649902344, 90.98063659667969, 98.05199432373047, 105.12335205078125, 112.1947021484375, 119.26605224609375, 126.33740997314453, 133.4087677001953, 140.48011779785156, 147.5514678955078, 154.62283325195312, 161.69418334960938, 168.76553344726562, 175.83688354492188, 182.90823364257812, 189.97959899902344, 197.0509490966797, 204.12229919433594, 211.19366455078125, 218.2650146484375, 225.33636474609375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 9.0, 8.0, 9.0, 11.0, 11.0, 22.0, 41.0, 39.0, 61.0, 71.0, 89.0, 122.0, 194.0, 245.0, 342.0, 435.0, 602.0, 744.0, 1239.0, 1040828.0, 802.0, 677.0, 506.0, 347.0, 305.0, 194.0, 146.0, 116.0, 75.0, 61.0, 40.0, 40.0, 24.0, 20.0, 14.0, 18.0, 12.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.662567138671875, -42.0578727722168, -40.453182220458984, -38.848487854003906, -37.243797302246094, -35.639102935791016, -34.03440856933594, -32.429718017578125, -30.82502555847168, -29.220333099365234, -27.61564064025879, -26.010948181152344, -24.406253814697266, -22.801563262939453, -21.196868896484375, -19.59217643737793, -17.987483978271484, -16.38279151916504, -14.778099060058594, -13.173405647277832, -11.568713188171387, -9.964020729064941, -8.35932731628418, -6.754634857177734, -5.149942398071289, -3.5452497005462646, -1.9405570030212402, -0.3358640670776367, 1.2688283920288086, 2.873520851135254, 4.478214263916016, 6.082906723022461, 7.687602996826172, 9.292295455932617, 10.896987915039062, 12.501681327819824, 14.10637378692627, 15.711066246032715, 17.315759658813477, 18.920452117919922, 20.525144577026367, 22.129837036132812, 23.734529495239258, 25.339221954345703, 26.94391632080078, 28.548606872558594, 30.153301239013672, 31.757993698120117, 33.36268615722656, 34.96738052368164, 36.57207107543945, 38.17676544189453, 39.781455993652344, 41.38615036010742, 42.9908447265625, 44.59553527832031, 46.200225830078125, 47.8049201965332, 49.409610748291016, 51.014305114746094, 52.618995666503906, 54.223690032958984, 55.82838439941406, 57.433074951171875, 59.03776931762695]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 14.0, 14.0, 21.0, 63.0, 447.0, 51462376.0, 120.0, 20.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3986.817138671875, -3800.021240234375, -3613.225341796875, -3426.4296875, -3239.6337890625, -3052.837890625, -2866.0419921875, -2679.24609375, -2492.4501953125, -2305.654296875, -2118.8583984375, -1932.0626220703125, -1745.2667236328125, -1558.4708251953125, -1371.675048828125, -1184.879150390625, -998.083251953125, -811.287353515625, -624.4915161132812, -437.6956787109375, -250.8997802734375, -64.1038818359375, 122.69189453125, 309.48779296875, 496.28369140625, 683.07958984375, 869.8754272460938, 1056.6712646484375, 1243.4671630859375, 1430.2630615234375, 1617.058837890625, 1803.854736328125, 1990.650390625, 2177.4462890625, 2364.2421875, 2551.0380859375, 2737.833984375, 2924.6298828125, 3111.425537109375, 3298.221435546875, 3485.017333984375, 3671.813232421875, 3858.609130859375, 4045.40478515625, 4232.20068359375, 4418.99658203125, 4605.79248046875, 4792.58837890625, 4979.38427734375, 5166.18017578125, 5352.97607421875, 5539.77197265625, 5726.56787109375, 5913.36376953125, 6100.1591796875, 6286.955078125, 6473.7509765625, 6660.546875, 6847.3427734375, 7034.138671875, 7220.9345703125, 7407.73046875, 7594.5263671875, 7781.322265625, 7968.1181640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 9.0, 13.0, 27.0, 37.0, 49.0, 70.0, 100.0, 133.0, 213.0, 350.0, 514.0, 769.0, 1206.0, 1771.0, 2622.0, 3765.0, 5422.0, 8543.0, 12433.0, 18256.0, 27801.0, 41151.0, 60176.0, 89086.0, 129959.0, 185002.0, 254876.0, 332189.0, 1713375.0, 2200863.0, 338229.0, 260509.0, 188864.0, 131972.0, 91061.0, 61354.0, 42275.0, 28225.0, 19191.0, 12790.0, 8643.0, 5723.0, 3904.0, 2545.0, 1769.0, 1220.0, 815.0, 558.0, 354.0, 225.0, 157.0, 90.0, 70.0, 46.0, 36.0, 15.0, 11.0, 6.0, 4.0, 2.0, 2.0], "bins": [-1.7490234375, -1.6944122314453125, -1.639801025390625, -1.5851898193359375, -1.53057861328125, -1.4759674072265625, -1.421356201171875, -1.3667449951171875, -1.3121337890625, -1.2575225830078125, -1.202911376953125, -1.1483001708984375, -1.09368896484375, -1.0390777587890625, -0.984466552734375, -0.9298553466796875, -0.875244140625, -0.8206329345703125, -0.766021728515625, -0.7114105224609375, -0.65679931640625, -0.6021881103515625, -0.547576904296875, -0.4929656982421875, -0.4383544921875, -0.3837432861328125, -0.329132080078125, -0.2745208740234375, -0.21990966796875, -0.1652984619140625, -0.110687255859375, -0.0560760498046875, -0.00146484375, 0.0531463623046875, 0.107757568359375, 0.1623687744140625, 0.21697998046875, 0.2715911865234375, 0.326202392578125, 0.3808135986328125, 0.4354248046875, 0.4900360107421875, 0.544647216796875, 0.5992584228515625, 0.65386962890625, 0.7084808349609375, 0.763092041015625, 0.8177032470703125, 0.872314453125, 0.9269256591796875, 0.981536865234375, 1.0361480712890625, 1.09075927734375, 1.1453704833984375, 1.199981689453125, 1.2545928955078125, 1.3092041015625, 1.3638153076171875, 1.418426513671875, 1.4730377197265625, 1.52764892578125, 1.5822601318359375, 1.636871337890625, 1.6914825439453125, 1.74609375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 6.0, 17.0, 16.0, 17.0, 16.0, 24.0, 20.0, 27.0, 33.0, 35.0, 32.0, 28.0, 40.0, 46.0, 50.0, 70.0, 836.0, 231.0, 36.0, 35.0, 39.0, 40.0, 37.0, 31.0, 36.0, 27.0, 25.0, 31.0, 19.0, 11.0, 13.0, 19.0, 11.0, 8.0, 9.0, 9.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2247314453125, -14.676025390625, -14.1273193359375, -13.57861328125, -13.0299072265625, -12.481201171875, -11.9324951171875, -11.3837890625, -10.8350830078125, -10.286376953125, -9.7376708984375, -9.18896484375, -8.6402587890625, -8.091552734375, -7.5428466796875, -6.994140625, -6.4454345703125, -5.896728515625, -5.3480224609375, -4.79931640625, -4.2506103515625, -3.701904296875, -3.1531982421875, -2.6044921875, -2.0557861328125, -1.507080078125, -0.9583740234375, -0.40966796875, 0.1390380859375, 0.687744140625, 1.2364501953125, 1.78515625, 2.3338623046875, 2.882568359375, 3.4312744140625, 3.97998046875, 4.5286865234375, 5.077392578125, 5.6260986328125, 6.1748046875, 6.7235107421875, 7.272216796875, 7.8209228515625, 8.36962890625, 8.9183349609375, 9.467041015625, 10.0157470703125, 10.564453125, 11.1131591796875, 11.661865234375, 12.2105712890625, 12.75927734375, 13.3079833984375, 13.856689453125, 14.4053955078125, 14.9541015625, 15.5028076171875, 16.051513671875, 16.6002197265625, 17.14892578125, 17.6976318359375, 18.246337890625, 18.7950439453125, 19.34375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 12.0, 6.0, 12.0, 22.0, 29.0, 51.0, 78.0, 114.0, 185.0, 254.0, 424.0, 682.0, 989.0, 1596.0, 2346.0, 3884.0, 6258.0, 9752.0, 15404.0, 24459.0, 40082.0, 63522.0, 101047.0, 159392.0, 238721.0, 339788.0, 600532.0, 3405163.0, 412485.0, 300125.0, 204884.0, 134118.0, 84283.0, 52967.0, 32496.0, 20471.0, 12875.0, 7941.0, 5065.0, 3166.0, 1998.0, 1298.0, 838.0, 571.0, 355.0, 250.0, 153.0, 95.0, 70.0, 48.0, 32.0, 18.0, 16.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.9287109375, -1.8650665283203125, -1.801422119140625, -1.7377777099609375, -1.67413330078125, -1.6104888916015625, -1.546844482421875, -1.4832000732421875, -1.4195556640625, -1.3559112548828125, -1.292266845703125, -1.2286224365234375, -1.16497802734375, -1.1013336181640625, -1.037689208984375, -0.9740447998046875, -0.910400390625, -0.8467559814453125, -0.783111572265625, -0.7194671630859375, -0.65582275390625, -0.5921783447265625, -0.528533935546875, -0.4648895263671875, -0.4012451171875, -0.3376007080078125, -0.273956298828125, -0.2103118896484375, -0.14666748046875, -0.0830230712890625, -0.019378662109375, 0.0442657470703125, 0.10791015625, 0.1715545654296875, 0.235198974609375, 0.2988433837890625, 0.36248779296875, 0.4261322021484375, 0.489776611328125, 0.5534210205078125, 0.6170654296875, 0.6807098388671875, 0.744354248046875, 0.8079986572265625, 0.87164306640625, 0.9352874755859375, 0.998931884765625, 1.0625762939453125, 1.126220703125, 1.1898651123046875, 1.253509521484375, 1.3171539306640625, 1.38079833984375, 1.4444427490234375, 1.508087158203125, 1.5717315673828125, 1.6353759765625, 1.6990203857421875, 1.762664794921875, 1.8263092041015625, 1.88995361328125, 1.9535980224609375, 2.017242431640625, 2.0808868408203125, 2.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 9.0, 10.0, 6.0, 12.0, 15.0, 12.0, 25.0, 15.0, 28.0, 20.0, 20.0, 36.0, 31.0, 37.0, 33.0, 33.0, 34.0, 42.0, 68.0, 738.0, 314.0, 40.0, 34.0, 48.0, 35.0, 44.0, 30.0, 30.0, 23.0, 22.0, 18.0, 23.0, 22.0, 14.0, 14.0, 12.0, 10.0, 15.0, 13.0, 5.0, 8.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.7734375, -12.384521484375, -11.99560546875, -11.606689453125, -11.2177734375, -10.828857421875, -10.43994140625, -10.051025390625, -9.662109375, -9.273193359375, -8.88427734375, -8.495361328125, -8.1064453125, -7.717529296875, -7.32861328125, -6.939697265625, -6.55078125, -6.161865234375, -5.77294921875, -5.384033203125, -4.9951171875, -4.606201171875, -4.21728515625, -3.828369140625, -3.439453125, -3.050537109375, -2.66162109375, -2.272705078125, -1.8837890625, -1.494873046875, -1.10595703125, -0.717041015625, -0.328125, 0.060791015625, 0.44970703125, 0.838623046875, 1.2275390625, 1.616455078125, 2.00537109375, 2.394287109375, 2.783203125, 3.172119140625, 3.56103515625, 3.949951171875, 4.3388671875, 4.727783203125, 5.11669921875, 5.505615234375, 5.89453125, 6.283447265625, 6.67236328125, 7.061279296875, 7.4501953125, 7.839111328125, 8.22802734375, 8.616943359375, 9.005859375, 9.394775390625, 9.78369140625, 10.172607421875, 10.5615234375, 10.950439453125, 11.33935546875, 11.728271484375, 12.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 10.0, 8.0, 17.0, 19.0, 13.0, 44.0, 72.0, 102.0, 132.0, 147.0, 232.0, 363.0, 550.0, 820.0, 1268.0, 2252.0, 3857.0, 7165.0, 14495.0, 31165.0, 71220.0, 198695.0, 5734360.0, 125225.0, 51279.0, 23007.0, 10842.0, 5729.0, 3179.0, 1928.0, 1016.0, 715.0, 465.0, 282.0, 189.0, 145.0, 98.0, 86.0, 60.0, 38.0, 31.0, 22.0, 21.0, 6.0, 9.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.484375, -8.21337890625, -7.9423828125, -7.67138671875, -7.400390625, -7.12939453125, -6.8583984375, -6.58740234375, -6.31640625, -6.04541015625, -5.7744140625, -5.50341796875, -5.232421875, -4.96142578125, -4.6904296875, -4.41943359375, -4.1484375, -3.87744140625, -3.6064453125, -3.33544921875, -3.064453125, -2.79345703125, -2.5224609375, -2.25146484375, -1.98046875, -1.70947265625, -1.4384765625, -1.16748046875, -0.896484375, -0.62548828125, -0.3544921875, -0.08349609375, 0.1875, 0.45849609375, 0.7294921875, 1.00048828125, 1.271484375, 1.54248046875, 1.8134765625, 2.08447265625, 2.35546875, 2.62646484375, 2.8974609375, 3.16845703125, 3.439453125, 3.71044921875, 3.9814453125, 4.25244140625, 4.5234375, 4.79443359375, 5.0654296875, 5.33642578125, 5.607421875, 5.87841796875, 6.1494140625, 6.42041015625, 6.69140625, 6.96240234375, 7.2333984375, 7.50439453125, 7.775390625, 8.04638671875, 8.3173828125, 8.58837890625, 8.859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 10.0, 13.0, 13.0, 9.0, 16.0, 20.0, 22.0, 24.0, 26.0, 26.0, 36.0, 36.0, 33.0, 30.0, 38.0, 49.0, 225.0, 786.0, 130.0, 61.0, 47.0, 34.0, 33.0, 37.0, 28.0, 27.0, 23.0, 26.0, 28.0, 26.0, 16.0, 10.0, 9.0, 12.0, 8.0, 11.0, 10.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.546875, -12.1827392578125, -11.818603515625, -11.4544677734375, -11.09033203125, -10.7261962890625, -10.362060546875, -9.9979248046875, -9.6337890625, -9.2696533203125, -8.905517578125, -8.5413818359375, -8.17724609375, -7.8131103515625, -7.448974609375, -7.0848388671875, -6.720703125, -6.3565673828125, -5.992431640625, -5.6282958984375, -5.26416015625, -4.9000244140625, -4.535888671875, -4.1717529296875, -3.8076171875, -3.4434814453125, -3.079345703125, -2.7152099609375, -2.35107421875, -1.9869384765625, -1.622802734375, -1.2586669921875, -0.89453125, -0.5303955078125, -0.166259765625, 0.1978759765625, 0.56201171875, 0.9261474609375, 1.290283203125, 1.6544189453125, 2.0185546875, 2.3826904296875, 2.746826171875, 3.1109619140625, 3.47509765625, 3.8392333984375, 4.203369140625, 4.5675048828125, 4.931640625, 5.2957763671875, 5.659912109375, 6.0240478515625, 6.38818359375, 6.7523193359375, 7.116455078125, 7.4805908203125, 7.8447265625, 8.2088623046875, 8.572998046875, 8.9371337890625, 9.30126953125, 9.6654052734375, 10.029541015625, 10.3936767578125, 10.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 8.0, 11.0, 14.0, 16.0, 29.0, 33.0, 66.0, 72.0, 94.0, 133.0, 130.0, 132.0, 77.0, 48.0, 35.0, 28.0, 17.0, 18.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.085384368896484, -23.286029815673828, -22.486675262451172, -21.68732261657715, -20.887968063354492, -20.088613510131836, -19.289260864257812, -18.489906311035156, -17.6905517578125, -16.891197204589844, -16.091842651367188, -15.292490005493164, -14.493135452270508, -13.693780899047852, -12.894427299499512, -12.095073699951172, -11.295719146728516, -10.49636459350586, -9.69701099395752, -8.89765739440918, -8.098302841186523, -7.298948764801025, -6.499594688415527, -5.700240612030029, -4.900886535644531, -4.101532459259033, -3.302178382873535, -2.502824306488037, -1.703470230102539, -0.904116153717041, -0.10476207733154297, 0.6945919990539551, 1.4939441680908203, 2.2932982444763184, 3.0926523208618164, 3.8920063972473145, 4.6913604736328125, 5.4907145500183105, 6.290068626403809, 7.089422702789307, 7.888776779174805, 8.688131332397461, 9.4874849319458, 10.28683853149414, 11.086193084716797, 11.885547637939453, 12.684901237487793, 13.484254837036133, 14.283609390258789, 15.082963943481445, 15.882317543029785, 16.681671142578125, 17.48102569580078, 18.280380249023438, 19.079734802246094, 19.879087448120117, 20.678442001342773, 21.47779655456543, 22.277149200439453, 23.07650375366211, 23.875858306884766, 24.675212860107422, 25.474567413330078, 26.2739200592041, 27.073274612426758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 9.0, 26.0, 16.0, 21.0, 29.0, 50.0, 61.0, 57.0, 74.0, 94.0, 96.0, 92.0, 91.0, 64.0, 51.0, 34.0, 31.0, 29.0, 22.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.219627380371094, -43.7860107421875, -42.35239791870117, -40.91878128051758, -39.48516845703125, -38.051551818847656, -36.61793518066406, -35.18431854248047, -33.75070571899414, -32.31708908081055, -30.88347625732422, -29.449859619140625, -28.016244888305664, -26.582630157470703, -25.14901351928711, -23.71539878845215, -22.281784057617188, -20.848169326782227, -19.414554595947266, -17.980937957763672, -16.54732322692871, -15.11370849609375, -13.680092811584473, -12.246477127075195, -10.812862396240234, -9.379247665405273, -7.945631980895996, -6.512016773223877, -5.078401565551758, -3.6447863578796387, -2.2111711502075195, -0.7775554656982422, 0.6560592651367188, 2.089674472808838, 3.523289680480957, 4.956904888153076, 6.390520095825195, 7.8241353034973145, 9.257750511169434, 10.691366195678711, 12.124980926513672, 13.558595657348633, 14.99221134185791, 16.425827026367188, 17.85944175720215, 19.29305648803711, 20.726673126220703, 22.160287857055664, 23.593902587890625, 25.027517318725586, 26.461132049560547, 27.89474868774414, 29.3283634185791, 30.761978149414062, 32.195594787597656, 33.62921142578125, 35.06282424926758, 36.49644088745117, 37.9300537109375, 39.363670349121094, 40.79728698730469, 42.230899810791016, 43.66451644897461, 45.09812927246094, 46.53174591064453]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 16.0, 20.0, 14.0, 39.0, 34.0, 52.0, 81.0, 101.0, 159.0, 212.0, 313.0, 457.0, 775.0, 1185.0, 2053.0, 3938.0, 8291.0, 22207.0, 103419.0, 3934269.0, 77218.0, 20115.0, 8370.0, 4210.0, 2318.0, 1406.0, 899.0, 578.0, 440.0, 276.0, 207.0, 154.0, 119.0, 83.0, 67.0, 33.0, 46.0, 16.0, 14.0, 15.0, 12.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.025390625, -0.9937820434570312, -0.9621734619140625, -0.9305648803710938, -0.898956298828125, -0.8673477172851562, -0.8357391357421875, -0.8041305541992188, -0.77252197265625, -0.7409133911132812, -0.7093048095703125, -0.6776962280273438, -0.646087646484375, -0.6144790649414062, -0.5828704833984375, -0.5512619018554688, -0.5196533203125, -0.48804473876953125, -0.4564361572265625, -0.42482757568359375, -0.393218994140625, -0.36161041259765625, -0.3300018310546875, -0.29839324951171875, -0.26678466796875, -0.23517608642578125, -0.2035675048828125, -0.17195892333984375, -0.140350341796875, -0.10874176025390625, -0.0771331787109375, -0.04552459716796875, -0.013916015625, 0.01769256591796875, 0.0493011474609375, 0.08090972900390625, 0.112518310546875, 0.14412689208984375, 0.1757354736328125, 0.20734405517578125, 0.23895263671875, 0.27056121826171875, 0.3021697998046875, 0.33377838134765625, 0.365386962890625, 0.39699554443359375, 0.4286041259765625, 0.46021270751953125, 0.4918212890625, 0.5234298706054688, 0.5550384521484375, 0.5866470336914062, 0.618255615234375, 0.6498641967773438, 0.6814727783203125, 0.7130813598632812, 0.74468994140625, 0.7762985229492188, 0.8079071044921875, 0.8395156860351562, 0.871124267578125, 0.9027328491210938, 0.9343414306640625, 0.9659500122070312, 0.99755859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 6.0, 8.0, 16.0, 10.0, 12.0, 24.0, 134.0, 669.0, 16.0, 11.0, 10.0, 17.0, 8.0, 4.0, 4.0, 5.0, 1.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29450225830078125, -0.2850494384765625, -0.27559661865234375, -0.266143798828125, -0.25669097900390625, -0.2472381591796875, -0.23778533935546875, -0.22833251953125, -0.21887969970703125, -0.2094268798828125, -0.19997406005859375, -0.190521240234375, -0.18106842041015625, -0.1716156005859375, -0.16216278076171875, -0.1527099609375, -0.14325714111328125, -0.1338043212890625, -0.12435150146484375, -0.114898681640625, -0.10544586181640625, -0.0959930419921875, -0.08654022216796875, -0.07708740234375, -0.06763458251953125, -0.0581817626953125, -0.04872894287109375, -0.039276123046875, -0.02982330322265625, -0.0203704833984375, -0.01091766357421875, -0.00146484375, 0.00798797607421875, 0.0174407958984375, 0.02689361572265625, 0.036346435546875, 0.04579925537109375, 0.0552520751953125, 0.06470489501953125, 0.07415771484375, 0.08361053466796875, 0.0930633544921875, 0.10251617431640625, 0.111968994140625, 0.12142181396484375, 0.1308746337890625, 0.14032745361328125, 0.1497802734375, 0.15923309326171875, 0.1686859130859375, 0.17813873291015625, 0.187591552734375, 0.19704437255859375, 0.2064971923828125, 0.21595001220703125, 0.22540283203125, 0.23485565185546875, 0.2443084716796875, 0.25376129150390625, 0.263214111328125, 0.27266693115234375, 0.2821197509765625, 0.29157257080078125, 0.301025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 6.0, 7.0, 17.0, 28.0, 26.0, 59.0, 80.0, 133.0, 205.0, 333.0, 535.0, 807.0, 1414.0, 2539.0, 4896.0, 10233.0, 26102.0, 82879.0, 489448.0, 3179223.0, 298901.0, 60327.0, 19506.0, 7983.0, 3735.0, 2017.0, 1141.0, 648.0, 388.0, 241.0, 136.0, 98.0, 64.0, 48.0, 23.0, 18.0, 12.0, 9.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7017669677734375, -0.679412841796875, -0.6570587158203125, -0.63470458984375, -0.6123504638671875, -0.589996337890625, -0.5676422119140625, -0.5452880859375, -0.5229339599609375, -0.500579833984375, -0.4782257080078125, -0.45587158203125, -0.4335174560546875, -0.411163330078125, -0.3888092041015625, -0.366455078125, -0.3441009521484375, -0.321746826171875, -0.2993927001953125, -0.27703857421875, -0.2546844482421875, -0.232330322265625, -0.2099761962890625, -0.1876220703125, -0.1652679443359375, -0.142913818359375, -0.1205596923828125, -0.09820556640625, -0.0758514404296875, -0.053497314453125, -0.0311431884765625, -0.0087890625, 0.0135650634765625, 0.035919189453125, 0.0582733154296875, 0.08062744140625, 0.1029815673828125, 0.125335693359375, 0.1476898193359375, 0.1700439453125, 0.1923980712890625, 0.214752197265625, 0.2371063232421875, 0.25946044921875, 0.2818145751953125, 0.304168701171875, 0.3265228271484375, 0.348876953125, 0.3712310791015625, 0.393585205078125, 0.4159393310546875, 0.43829345703125, 0.4606475830078125, 0.483001708984375, 0.5053558349609375, 0.5277099609375, 0.5500640869140625, 0.572418212890625, 0.5947723388671875, 0.61712646484375, 0.6394805908203125, 0.661834716796875, 0.6841888427734375, 0.70654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 11.0, 14.0, 26.0, 27.0, 38.0, 55.0, 63.0, 112.0, 220.0, 419.0, 1340.0, 935.0, 321.0, 170.0, 91.0, 61.0, 38.0, 29.0, 25.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.37078857421875, -0.3594970703125, -0.34820556640625, -0.3369140625, -0.32562255859375, -0.3143310546875, -0.30303955078125, -0.291748046875, -0.28045654296875, -0.2691650390625, -0.25787353515625, -0.24658203125, -0.23529052734375, -0.2239990234375, -0.21270751953125, -0.201416015625, -0.19012451171875, -0.1788330078125, -0.16754150390625, -0.15625, -0.14495849609375, -0.1336669921875, -0.12237548828125, -0.111083984375, -0.09979248046875, -0.0885009765625, -0.07720947265625, -0.06591796875, -0.05462646484375, -0.0433349609375, -0.03204345703125, -0.020751953125, -0.00946044921875, 0.0018310546875, 0.01312255859375, 0.0244140625, 0.03570556640625, 0.0469970703125, 0.05828857421875, 0.069580078125, 0.08087158203125, 0.0921630859375, 0.10345458984375, 0.11474609375, 0.12603759765625, 0.1373291015625, 0.14862060546875, 0.159912109375, 0.17120361328125, 0.1824951171875, 0.19378662109375, 0.205078125, 0.21636962890625, 0.2276611328125, 0.23895263671875, 0.250244140625, 0.26153564453125, 0.2728271484375, 0.28411865234375, 0.29541015625, 0.30670166015625, 0.3179931640625, 0.32928466796875, 0.340576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 15.0, 40.0, 61.0, 139.0, 183.0, 221.0, 131.0, 92.0, 53.0, 29.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9518307447433472, -1.8877747058868408, -1.8237186670303345, -1.7596626281738281, -1.6956065893173218, -1.6315505504608154, -1.5674943923950195, -1.5034384727478027, -1.4393823146820068, -1.3753262758255005, -1.3112702369689941, -1.2472141981124878, -1.1831581592559814, -1.119102120399475, -1.0550460815429688, -0.9909899830818176, -0.926934003829956, -0.8628779649734497, -0.7988219261169434, -0.734765887260437, -0.6707098484039307, -0.6066538095474243, -0.5425977110862732, -0.47854167222976685, -0.4144856333732605, -0.35042959451675415, -0.2863735556602478, -0.22231748700141907, -0.15826144814491272, -0.09420540928840637, -0.030149340629577637, 0.03390669822692871, 0.09796285629272461, 0.16201889514923096, 0.2260749489068985, 0.29013100266456604, 0.3541870415210724, 0.41824308037757874, 0.48229914903640747, 0.5463551878929138, 0.6104112267494202, 0.6744672656059265, 0.7385233044624329, 0.802579402923584, 0.8666354417800903, 0.9306914806365967, 0.994747519493103, 1.0588035583496094, 1.1228595972061157, 1.186915636062622, 1.2509716749191284, 1.3150277137756348, 1.3790837526321411, 1.4431397914886475, 1.5071959495544434, 1.5712518692016602, 1.635308027267456, 1.6993640661239624, 1.7634201049804688, 1.827476143836975, 1.8915321826934814, 1.9555882215499878, 2.019644260406494, 2.08370041847229, 2.147756338119507]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 12.0, 11.0, 16.0, 22.0, 22.0, 34.0, 34.0, 47.0, 58.0, 55.0, 59.0, 75.0, 86.0, 71.0, 78.0, 61.0, 55.0, 49.0, 40.0, 29.0, 19.0, 12.0, 15.0, 17.0, 7.0, 5.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5357944965362549, -1.4858287572860718, -1.4358630180358887, -1.3858972787857056, -1.3359315395355225, -1.285965919494629, -1.2360001802444458, -1.1860344409942627, -1.1360687017440796, -1.0861029624938965, -1.0361372232437134, -0.986171543598175, -0.9362058043479919, -0.8862400650978088, -0.8362743854522705, -0.7863086462020874, -0.7363429069519043, -0.6863771677017212, -0.6364114284515381, -0.5864457488059998, -0.5364800095558167, -0.48651427030563354, -0.4365485608577728, -0.3865828514099121, -0.336617112159729, -0.2866513729095459, -0.23668566346168518, -0.18671993911266327, -0.13675421476364136, -0.08678849041461945, -0.036822766065597534, 0.013142943382263184, 0.06310880184173584, 0.11307452619075775, 0.16304025053977966, 0.21300597488880157, 0.2629716992378235, 0.3129374384880066, 0.3629031479358673, 0.412868857383728, 0.46283459663391113, 0.5128003358840942, 0.5627660751342773, 0.6127317547798157, 0.6626974940299988, 0.7126632332801819, 0.7626289129257202, 0.8125946521759033, 0.8625603914260864, 0.9125261306762695, 0.9624918699264526, 1.0124576091766357, 1.0624232292175293, 1.1123889684677124, 1.1623547077178955, 1.2123204469680786, 1.2622861862182617, 1.3122519254684448, 1.362217664718628, 1.412183403968811, 1.4621491432189941, 1.5121147632598877, 1.5620805025100708, 1.612046241760254, 1.662011981010437]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 11.0, 16.0, 23.0, 36.0, 46.0, 66.0, 78.0, 132.0, 180.0, 279.0, 353.0, 531.0, 715.0, 1045.0, 1611.0, 2498.0, 3894.0, 6443.0, 11357.0, 22655.0, 94297.0, 818239.0, 42155.0, 17335.0, 9247.0, 5385.0, 3254.0, 2114.0, 1378.0, 983.0, 657.0, 462.0, 318.0, 230.0, 167.0, 112.0, 81.0, 50.0, 29.0, 22.0, 23.0, 15.0, 12.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9169921875, -0.8886184692382812, -0.8602447509765625, -0.8318710327148438, -0.803497314453125, -0.7751235961914062, -0.7467498779296875, -0.7183761596679688, -0.69000244140625, -0.6616287231445312, -0.6332550048828125, -0.6048812866210938, -0.576507568359375, -0.5481338500976562, -0.5197601318359375, -0.49138641357421875, -0.4630126953125, -0.43463897705078125, -0.4062652587890625, -0.37789154052734375, -0.349517822265625, -0.32114410400390625, -0.2927703857421875, -0.26439666748046875, -0.23602294921875, -0.20764923095703125, -0.1792755126953125, -0.15090179443359375, -0.122528076171875, -0.09415435791015625, -0.0657806396484375, -0.03740692138671875, -0.009033203125, 0.01934051513671875, 0.0477142333984375, 0.07608795166015625, 0.104461669921875, 0.13283538818359375, 0.1612091064453125, 0.18958282470703125, 0.21795654296875, 0.24633026123046875, 0.2747039794921875, 0.30307769775390625, 0.331451416015625, 0.35982513427734375, 0.3881988525390625, 0.41657257080078125, 0.4449462890625, 0.47332000732421875, 0.5016937255859375, 0.5300674438476562, 0.558441162109375, 0.5868148803710938, 0.6151885986328125, 0.6435623168945312, 0.67193603515625, 0.7003097534179688, 0.7286834716796875, 0.7570571899414062, 0.785430908203125, 0.8138046264648438, 0.8421783447265625, 0.8705520629882812, 0.89892578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 3.0, 5.0, 5.0, 11.0, 9.0, 19.0, 20.0, 82.0, 405.0, 299.0, 45.0, 9.0, 10.0, 14.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27338409423828125, -0.2645416259765625, -0.25569915771484375, -0.246856689453125, -0.23801422119140625, -0.2291717529296875, -0.22032928466796875, -0.21148681640625, -0.20264434814453125, -0.1938018798828125, -0.18495941162109375, -0.176116943359375, -0.16727447509765625, -0.1584320068359375, -0.14958953857421875, -0.1407470703125, -0.13190460205078125, -0.1230621337890625, -0.11421966552734375, -0.105377197265625, -0.09653472900390625, -0.0876922607421875, -0.07884979248046875, -0.07000732421875, -0.06116485595703125, -0.0523223876953125, -0.04347991943359375, -0.034637451171875, -0.02579498291015625, -0.0169525146484375, -0.00811004638671875, 0.000732421875, 0.00957489013671875, 0.0184173583984375, 0.02725982666015625, 0.036102294921875, 0.04494476318359375, 0.0537872314453125, 0.06262969970703125, 0.07147216796875, 0.08031463623046875, 0.0891571044921875, 0.09799957275390625, 0.106842041015625, 0.11568450927734375, 0.1245269775390625, 0.13336944580078125, 0.1422119140625, 0.15105438232421875, 0.1598968505859375, 0.16873931884765625, 0.177581787109375, 0.18642425537109375, 0.1952667236328125, 0.20410919189453125, 0.21295166015625, 0.22179412841796875, 0.2306365966796875, 0.23947906494140625, 0.248321533203125, 0.25716400146484375, 0.2660064697265625, 0.27484893798828125, 0.28369140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 11.0, 12.0, 19.0, 28.0, 29.0, 59.0, 78.0, 105.0, 127.0, 187.0, 257.0, 400.0, 629.0, 966.0, 1425.0, 2361.0, 4091.0, 6827.0, 12397.0, 22583.0, 43917.0, 90770.0, 208490.0, 333726.0, 164491.0, 73426.0, 36048.0, 19150.0, 10370.0, 5988.0, 3524.0, 2084.0, 1368.0, 827.0, 555.0, 378.0, 252.0, 177.0, 118.0, 73.0, 65.0, 38.0, 43.0, 22.0, 20.0, 11.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.548828125, -0.5301361083984375, -0.511444091796875, -0.4927520751953125, -0.47406005859375, -0.4553680419921875, -0.436676025390625, -0.4179840087890625, -0.3992919921875, -0.3805999755859375, -0.361907958984375, -0.3432159423828125, -0.32452392578125, -0.3058319091796875, -0.287139892578125, -0.2684478759765625, -0.249755859375, -0.2310638427734375, -0.212371826171875, -0.1936798095703125, -0.17498779296875, -0.1562957763671875, -0.137603759765625, -0.1189117431640625, -0.1002197265625, -0.0815277099609375, -0.062835693359375, -0.0441436767578125, -0.02545166015625, -0.0067596435546875, 0.011932373046875, 0.0306243896484375, 0.04931640625, 0.0680084228515625, 0.086700439453125, 0.1053924560546875, 0.12408447265625, 0.1427764892578125, 0.161468505859375, 0.1801605224609375, 0.1988525390625, 0.2175445556640625, 0.236236572265625, 0.2549285888671875, 0.27362060546875, 0.2923126220703125, 0.311004638671875, 0.3296966552734375, 0.348388671875, 0.3670806884765625, 0.385772705078125, 0.4044647216796875, 0.42315673828125, 0.4418487548828125, 0.460540771484375, 0.4792327880859375, 0.4979248046875, 0.5166168212890625, 0.535308837890625, 0.5540008544921875, 0.57269287109375, 0.5913848876953125, 0.610076904296875, 0.6287689208984375, 0.6474609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 11.0, 16.0, 11.0, 9.0, 21.0, 22.0, 16.0, 25.0, 32.0, 35.0, 31.0, 32.0, 44.0, 34.0, 33.0, 44.0, 48.0, 46.0, 49.0, 48.0, 50.0, 36.0, 42.0, 36.0, 29.0, 28.0, 27.0, 22.0, 17.0, 13.0, 23.0, 11.0, 16.0, 10.0, 7.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.1455078125, -1.1130828857421875, -1.080657958984375, -1.0482330322265625, -1.01580810546875, -0.9833831787109375, -0.950958251953125, -0.9185333251953125, -0.8861083984375, -0.8536834716796875, -0.821258544921875, -0.7888336181640625, -0.75640869140625, -0.7239837646484375, -0.691558837890625, -0.6591339111328125, -0.626708984375, -0.5942840576171875, -0.561859130859375, -0.5294342041015625, -0.49700927734375, -0.4645843505859375, -0.432159423828125, -0.3997344970703125, -0.3673095703125, -0.3348846435546875, -0.302459716796875, -0.2700347900390625, -0.23760986328125, -0.2051849365234375, -0.172760009765625, -0.1403350830078125, -0.10791015625, -0.0754852294921875, -0.043060302734375, -0.0106353759765625, 0.02178955078125, 0.0542144775390625, 0.086639404296875, 0.1190643310546875, 0.1514892578125, 0.1839141845703125, 0.216339111328125, 0.2487640380859375, 0.28118896484375, 0.3136138916015625, 0.346038818359375, 0.3784637451171875, 0.410888671875, 0.4433135986328125, 0.475738525390625, 0.5081634521484375, 0.54058837890625, 0.5730133056640625, 0.605438232421875, 0.6378631591796875, 0.6702880859375, 0.7027130126953125, 0.735137939453125, 0.7675628662109375, 0.79998779296875, 0.8324127197265625, 0.864837646484375, 0.8972625732421875, 0.9296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 10.0, 17.0, 28.0, 37.0, 66.0, 146.0, 383.0, 1507.0, 13761.0, 969298.0, 59222.0, 3063.0, 583.0, 205.0, 93.0, 54.0, 31.0, 14.0, 15.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.3023681640625, -3.204345703125, -3.1063232421875, -3.00830078125, -2.9102783203125, -2.812255859375, -2.7142333984375, -2.6162109375, -2.5181884765625, -2.420166015625, -2.3221435546875, -2.22412109375, -2.1260986328125, -2.028076171875, -1.9300537109375, -1.83203125, -1.7340087890625, -1.635986328125, -1.5379638671875, -1.43994140625, -1.3419189453125, -1.243896484375, -1.1458740234375, -1.0478515625, -0.9498291015625, -0.851806640625, -0.7537841796875, -0.65576171875, -0.5577392578125, -0.459716796875, -0.3616943359375, -0.263671875, -0.1656494140625, -0.067626953125, 0.0303955078125, 0.12841796875, 0.2264404296875, 0.324462890625, 0.4224853515625, 0.5205078125, 0.6185302734375, 0.716552734375, 0.8145751953125, 0.91259765625, 1.0106201171875, 1.108642578125, 1.2066650390625, 1.3046875, 1.4027099609375, 1.500732421875, 1.5987548828125, 1.69677734375, 1.7947998046875, 1.892822265625, 1.9908447265625, 2.0888671875, 2.1868896484375, 2.284912109375, 2.3829345703125, 2.48095703125, 2.5789794921875, 2.677001953125, 2.7750244140625, 2.873046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 23.0, 59.0, 101.0, 170.0, 211.0, 195.0, 90.0, 73.0, 28.0, 14.0, 9.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001780986785888672, -0.00017400365322828293, -0.00016990862786769867, -0.0001658136025071144, -0.00016171857714653015, -0.0001576235517859459, -0.00015352852642536163, -0.00014943350106477737, -0.00014533847570419312, -0.00014124345034360886, -0.0001371484249830246, -0.00013305339962244034, -0.00012895837426185608, -0.00012486334890127182, -0.00012076832354068756, -0.0001166732981801033, -0.00011257827281951904, -0.00010848324745893478, -0.00010438822209835052, -0.00010029319673776627, -9.619817137718201e-05, -9.210314601659775e-05, -8.800812065601349e-05, -8.391309529542923e-05, -7.981806993484497e-05, -7.572304457426071e-05, -7.162801921367645e-05, -6.75329938530922e-05, -6.343796849250793e-05, -5.9342943131923676e-05, -5.5247917771339417e-05, -5.115289241075516e-05, -4.70578670501709e-05, -4.296284168958664e-05, -3.886781632900238e-05, -3.477279096841812e-05, -3.067776560783386e-05, -2.6582740247249603e-05, -2.2487714886665344e-05, -1.8392689526081085e-05, -1.4297664165496826e-05, -1.0202638804912567e-05, -6.107613444328308e-06, -2.012588083744049e-06, 2.08243727684021e-06, 6.177462637424469e-06, 1.0272487998008728e-05, 1.4367513358592987e-05, 1.8462538719177246e-05, 2.2557564079761505e-05, 2.6652589440345764e-05, 3.074761480093002e-05, 3.484264016151428e-05, 3.893766552209854e-05, 4.30326908826828e-05, 4.712771624326706e-05, 5.122274160385132e-05, 5.531776696443558e-05, 5.9412792325019836e-05, 6.35078176856041e-05, 6.760284304618835e-05, 7.169786840677261e-05, 7.579289376735687e-05, 7.988791912794113e-05, 8.398294448852539e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 22.0, 25.0, 40.0, 51.0, 77.0, 118.0, 214.0, 340.0, 652.0, 1574.0, 3997.0, 14091.0, 81610.0, 685396.0, 221721.0, 27545.0, 6560.0, 2275.0, 990.0, 480.0, 299.0, 132.0, 120.0, 58.0, 48.0, 25.0, 22.0, 13.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.987945556640625, -0.94952392578125, -0.911102294921875, -0.8726806640625, -0.834259033203125, -0.79583740234375, -0.757415771484375, -0.718994140625, -0.680572509765625, -0.64215087890625, -0.603729248046875, -0.5653076171875, -0.526885986328125, -0.48846435546875, -0.450042724609375, -0.41162109375, -0.373199462890625, -0.33477783203125, -0.296356201171875, -0.2579345703125, -0.219512939453125, -0.18109130859375, -0.142669677734375, -0.104248046875, -0.065826416015625, -0.02740478515625, 0.011016845703125, 0.0494384765625, 0.087860107421875, 0.12628173828125, 0.164703369140625, 0.203125, 0.241546630859375, 0.27996826171875, 0.318389892578125, 0.3568115234375, 0.395233154296875, 0.43365478515625, 0.472076416015625, 0.510498046875, 0.548919677734375, 0.58734130859375, 0.625762939453125, 0.6641845703125, 0.702606201171875, 0.74102783203125, 0.779449462890625, 0.81787109375, 0.856292724609375, 0.89471435546875, 0.933135986328125, 0.9715576171875, 1.009979248046875, 1.04840087890625, 1.086822509765625, 1.125244140625, 1.163665771484375, 1.20208740234375, 1.240509033203125, 1.2789306640625, 1.317352294921875, 1.35577392578125, 1.394195556640625, 1.4326171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 9.0, 8.0, 11.0, 25.0, 40.0, 43.0, 91.0, 121.0, 121.0, 131.0, 131.0, 105.0, 68.0, 34.0, 21.0, 17.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.899139404296875, -0.85394287109375, -0.808746337890625, -0.7635498046875, -0.718353271484375, -0.67315673828125, -0.627960205078125, -0.582763671875, -0.537567138671875, -0.49237060546875, -0.447174072265625, -0.4019775390625, -0.356781005859375, -0.31158447265625, -0.266387939453125, -0.22119140625, -0.175994873046875, -0.13079833984375, -0.085601806640625, -0.0404052734375, 0.004791259765625, 0.04998779296875, 0.095184326171875, 0.140380859375, 0.185577392578125, 0.23077392578125, 0.275970458984375, 0.3211669921875, 0.366363525390625, 0.41156005859375, 0.456756591796875, 0.501953125, 0.547149658203125, 0.59234619140625, 0.637542724609375, 0.6827392578125, 0.727935791015625, 0.77313232421875, 0.818328857421875, 0.863525390625, 0.908721923828125, 0.95391845703125, 0.999114990234375, 1.0443115234375, 1.089508056640625, 1.13470458984375, 1.179901123046875, 1.22509765625, 1.270294189453125, 1.31549072265625, 1.360687255859375, 1.4058837890625, 1.451080322265625, 1.49627685546875, 1.541473388671875, 1.586669921875, 1.631866455078125, 1.67706298828125, 1.722259521484375, 1.7674560546875, 1.812652587890625, 1.85784912109375, 1.903045654296875, 1.9482421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 14.0, 11.0, 28.0, 45.0, 91.0, 168.0, 233.0, 164.0, 81.0, 53.0, 38.0, 23.0, 14.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.532609939575195, -9.185256004333496, -8.837903022766113, -8.490549087524414, -8.143196105957031, -7.795842170715332, -7.448488235473633, -7.101134777069092, -6.753781318664551, -6.40642786026001, -6.059074401855469, -5.7117204666137695, -5.3643670082092285, -5.0170135498046875, -4.669659614562988, -4.322306156158447, -3.9749526977539062, -3.6275992393493652, -3.280245542526245, -2.932891845703125, -2.585538387298584, -2.238184928894043, -1.8908312320709229, -1.5434775352478027, -1.1961240768432617, -0.8487704992294312, -0.5014169216156006, -0.15406334400177002, 0.19329023361206055, 0.5406438112258911, 0.8879973888397217, 1.2353510856628418, 1.5827054977416992, 1.9300590753555298, 2.2774126529693604, 2.6247663497924805, 2.9721198081970215, 3.3194732666015625, 3.6668269634246826, 4.014180660247803, 4.361534118652344, 4.708887577056885, 5.056241035461426, 5.403594970703125, 5.750948429107666, 6.098301887512207, 6.445655822753906, 6.793009281158447, 7.140362739562988, 7.487716197967529, 7.83506965637207, 8.18242359161377, 8.529777526855469, 8.877130508422852, 9.22448444366455, 9.57183837890625, 9.919191360473633, 10.266545295715332, 10.613898277282715, 10.961252212524414, 11.308605194091797, 11.655959129333496, 12.003313064575195, 12.350666046142578, 12.698019981384277]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 3.0, 8.0, 15.0, 15.0, 13.0, 39.0, 62.0, 106.0, 130.0, 167.0, 140.0, 99.0, 59.0, 30.0, 28.0, 14.0, 10.0, 6.0, 6.0, 5.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.883638381958008, -21.227081298828125, -20.57052230834961, -19.913965225219727, -19.257408142089844, -18.600849151611328, -17.944292068481445, -17.287734985351562, -16.631175994873047, -15.974617958068848, -15.318059921264648, -14.661502838134766, -14.004944801330566, -13.348386764526367, -12.691829681396484, -12.035271644592285, -11.378713607788086, -10.722155570983887, -10.065597534179688, -9.409040451049805, -8.752482414245605, -8.095924377441406, -7.439366817474365, -6.782809257507324, -6.126251220703125, -5.469693183898926, -4.813135623931885, -4.156578063964844, -3.5000200271606445, -2.8434622287750244, -2.1869044303894043, -1.5303468704223633, -0.8737907409667969, -0.21723294258117676, 0.43932485580444336, 1.0958826541900635, 1.7524404525756836, 2.4089982509613037, 3.065556049346924, 3.722113609313965, 4.378671646118164, 5.035229682922363, 5.691787242889404, 6.348344802856445, 7.0049028396606445, 7.661460876464844, 8.318017959594727, 8.974575996398926, 9.631134033203125, 10.287692070007324, 10.944250106811523, 11.600807189941406, 12.257365226745605, 12.913923263549805, 13.570480346679688, 14.227038383483887, 14.883596420288086, 15.540154457092285, 16.196712493896484, 16.853269577026367, 17.50982666015625, 18.166385650634766, 18.82294273376465, 19.47949981689453, 20.136058807373047]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 4.0, 13.0, 16.0, 25.0, 20.0, 33.0, 52.0, 76.0, 104.0, 125.0, 195.0, 255.0, 351.0, 457.0, 609.0, 907.0, 1297.0, 1928.0, 3221.0, 5923.0, 13002.0, 38951.0, 468225.0, 3567649.0, 57537.0, 15798.0, 6954.0, 3611.0, 2226.0, 1443.0, 963.0, 677.0, 466.0, 344.0, 234.0, 151.0, 121.0, 76.0, 73.0, 43.0, 33.0, 24.0, 17.0, 18.0, 13.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.412109375, -2.33929443359375, -2.2664794921875, -2.19366455078125, -2.120849609375, -2.04803466796875, -1.9752197265625, -1.90240478515625, -1.82958984375, -1.75677490234375, -1.6839599609375, -1.61114501953125, -1.538330078125, -1.46551513671875, -1.3927001953125, -1.31988525390625, -1.2470703125, -1.17425537109375, -1.1014404296875, -1.02862548828125, -0.955810546875, -0.88299560546875, -0.8101806640625, -0.73736572265625, -0.66455078125, -0.59173583984375, -0.5189208984375, -0.44610595703125, -0.373291015625, -0.30047607421875, -0.2276611328125, -0.15484619140625, -0.08203125, -0.00921630859375, 0.0635986328125, 0.13641357421875, 0.209228515625, 0.28204345703125, 0.3548583984375, 0.42767333984375, 0.50048828125, 0.57330322265625, 0.6461181640625, 0.71893310546875, 0.791748046875, 0.86456298828125, 0.9373779296875, 1.01019287109375, 1.0830078125, 1.15582275390625, 1.2286376953125, 1.30145263671875, 1.374267578125, 1.44708251953125, 1.5198974609375, 1.59271240234375, 1.66552734375, 1.73834228515625, 1.8111572265625, 1.88397216796875, 1.956787109375, 2.02960205078125, 2.1024169921875, 2.17523193359375, 2.248046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 12.0, 13.0, 18.0, 10.0, 27.0, 54.0, 96.0, 164.0, 219.0, 134.0, 79.0, 27.0, 21.0, 11.0, 10.0, 12.0, 5.0, 7.0, 6.0, 5.0, 8.0, 5.0, 8.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21610069274902344, -0.20917892456054688, -0.2022571563720703, -0.19533538818359375, -0.1884136199951172, -0.18149185180664062, -0.17457008361816406, -0.1676483154296875, -0.16072654724121094, -0.15380477905273438, -0.1468830108642578, -0.13996124267578125, -0.1330394744873047, -0.12611770629882812, -0.11919593811035156, -0.112274169921875, -0.10535240173339844, -0.09843063354492188, -0.09150886535644531, -0.08458709716796875, -0.07766532897949219, -0.07074356079101562, -0.06382179260253906, -0.0569000244140625, -0.04997825622558594, -0.043056488037109375, -0.03613471984863281, -0.02921295166015625, -0.022291183471679688, -0.015369415283203125, -0.008447647094726562, -0.00152587890625, 0.0053958892822265625, 0.012317657470703125, 0.019239425659179688, 0.02616119384765625, 0.03308296203613281, 0.040004730224609375, 0.04692649841308594, 0.0538482666015625, 0.06077003479003906, 0.06769180297851562, 0.07461357116699219, 0.08153533935546875, 0.08845710754394531, 0.09537887573242188, 0.10230064392089844, 0.109222412109375, 0.11614418029785156, 0.12306594848632812, 0.1299877166748047, 0.13690948486328125, 0.1438312530517578, 0.15075302124023438, 0.15767478942871094, 0.1645965576171875, 0.17151832580566406, 0.17844009399414062, 0.1853618621826172, 0.19228363037109375, 0.1992053985595703, 0.20612716674804688, 0.21304893493652344, 0.219970703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 15.0, 23.0, 21.0, 22.0, 43.0, 58.0, 76.0, 129.0, 162.0, 221.0, 385.0, 575.0, 813.0, 1251.0, 1941.0, 3234.0, 5487.0, 10211.0, 21073.0, 55148.0, 263442.0, 3427296.0, 299124.0, 58122.0, 21331.0, 10090.0, 5411.0, 3054.0, 1941.0, 1097.0, 777.0, 505.0, 371.0, 232.0, 161.0, 108.0, 81.0, 75.0, 42.0, 22.0, 25.0, 19.0, 17.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.494140625, -1.4481964111328125, -1.402252197265625, -1.3563079833984375, -1.31036376953125, -1.2644195556640625, -1.218475341796875, -1.1725311279296875, -1.1265869140625, -1.0806427001953125, -1.034698486328125, -0.9887542724609375, -0.94281005859375, -0.8968658447265625, -0.850921630859375, -0.8049774169921875, -0.759033203125, -0.7130889892578125, -0.667144775390625, -0.6212005615234375, -0.57525634765625, -0.5293121337890625, -0.483367919921875, -0.4374237060546875, -0.3914794921875, -0.3455352783203125, -0.299591064453125, -0.2536468505859375, -0.20770263671875, -0.1617584228515625, -0.115814208984375, -0.0698699951171875, -0.02392578125, 0.0220184326171875, 0.067962646484375, 0.1139068603515625, 0.15985107421875, 0.2057952880859375, 0.251739501953125, 0.2976837158203125, 0.3436279296875, 0.3895721435546875, 0.435516357421875, 0.4814605712890625, 0.52740478515625, 0.5733489990234375, 0.619293212890625, 0.6652374267578125, 0.711181640625, 0.7571258544921875, 0.803070068359375, 0.8490142822265625, 0.89495849609375, 0.9409027099609375, 0.986846923828125, 1.0327911376953125, 1.0787353515625, 1.1246795654296875, 1.170623779296875, 1.2165679931640625, 1.26251220703125, 1.3084564208984375, 1.354400634765625, 1.4003448486328125, 1.4462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 8.0, 2.0, 7.0, 12.0, 7.0, 12.0, 15.0, 10.0, 20.0, 25.0, 36.0, 43.0, 82.0, 178.0, 573.0, 2012.0, 483.0, 214.0, 124.0, 62.0, 40.0, 18.0, 17.0, 9.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.453125, -0.4409942626953125, -0.428863525390625, -0.4167327880859375, -0.40460205078125, -0.3924713134765625, -0.380340576171875, -0.3682098388671875, -0.3560791015625, -0.3439483642578125, -0.331817626953125, -0.3196868896484375, -0.30755615234375, -0.2954254150390625, -0.283294677734375, -0.2711639404296875, -0.259033203125, -0.2469024658203125, -0.234771728515625, -0.2226409912109375, -0.21051025390625, -0.1983795166015625, -0.186248779296875, -0.1741180419921875, -0.1619873046875, -0.1498565673828125, -0.137725830078125, -0.1255950927734375, -0.11346435546875, -0.1013336181640625, -0.089202880859375, -0.0770721435546875, -0.06494140625, -0.0528106689453125, -0.040679931640625, -0.0285491943359375, -0.01641845703125, -0.0042877197265625, 0.007843017578125, 0.0199737548828125, 0.0321044921875, 0.0442352294921875, 0.056365966796875, 0.0684967041015625, 0.08062744140625, 0.0927581787109375, 0.104888916015625, 0.1170196533203125, 0.129150390625, 0.1412811279296875, 0.153411865234375, 0.1655426025390625, 0.17767333984375, 0.1898040771484375, 0.201934814453125, 0.2140655517578125, 0.2261962890625, 0.2383270263671875, 0.250457763671875, 0.2625885009765625, 0.27471923828125, 0.2868499755859375, 0.298980712890625, 0.3111114501953125, 0.3232421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 39.0, 93.0, 370.0, 316.0, 83.0, 40.0, 19.0, 15.0, 4.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7284982204437256, -1.5678640604019165, -1.4072299003601074, -1.2465956211090088, -1.0859615802764893, -0.9253273606300354, -0.7646931409835815, -0.6040589809417725, -0.4434248208999634, -0.2827906608581543, -0.12215647101402283, 0.03847771883010864, 0.19911187887191772, 0.3597460389137268, 0.5203802585601807, 0.6810144186019897, 0.8416485786437988, 1.002282738685608, 1.162916898727417, 1.3235511779785156, 1.4841852188110352, 1.6448194980621338, 1.8054536581039429, 1.966087818145752, 2.1267218589782715, 2.28735613822937, 2.4479901790618896, 2.6086244583129883, 2.769258499145508, 2.9298927783966064, 3.090527057647705, 3.2511610984802246, 3.411795139312744, 3.5724294185638428, 3.7330634593963623, 3.893697738647461, 4.0543317794799805, 4.2149658203125, 4.375600337982178, 4.536234378814697, 4.696868419647217, 4.857502460479736, 5.018136978149414, 5.178771018981934, 5.339405059814453, 5.500039100646973, 5.66067361831665, 5.82130765914917, 5.981942176818848, 6.142576217651367, 6.303210735321045, 6.4638447761535645, 6.624478816986084, 6.7851128578186035, 6.945747375488281, 7.106381416320801, 7.26701545715332, 7.42764949798584, 7.588284015655518, 7.748918056488037, 7.909552097320557, 8.070186614990234, 8.230820655822754, 8.391454696655273, 8.552088737487793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 13.0, 24.0, 38.0, 44.0, 49.0, 72.0, 95.0, 82.0, 94.0, 85.0, 80.0, 74.0, 61.0, 37.0, 32.0, 26.0, 15.0, 21.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.585054874420166, -2.4972848892211914, -2.409514904022217, -2.321744918823242, -2.2339749336242676, -2.146204948425293, -2.0584349632263184, -1.9706652164459229, -1.8828952312469482, -1.7951252460479736, -1.707355260848999, -1.6195852756500244, -1.5318154096603394, -1.4440454244613647, -1.3562754392623901, -1.268505573272705, -1.180735468864441, -1.0929654836654663, -1.0051954984664917, -0.9174255728721619, -0.829655647277832, -0.7418856620788574, -0.6541156768798828, -0.566345751285553, -0.47857576608657837, -0.39080581068992615, -0.3030358552932739, -0.21526587009429932, -0.1274959146976471, -0.03972595930099487, 0.048044025897979736, 0.13581395149230957, 0.22358393669128418, 0.3113538920879364, 0.3991238474845886, 0.48689383268356323, 0.5746637582778931, 0.6624337434768677, 0.7502037286758423, 0.8379736542701721, 0.9257436394691467, 1.0135135650634766, 1.1012835502624512, 1.1890535354614258, 1.2768235206604004, 1.364593505859375, 1.4523634910583496, 1.5401333570480347, 1.6279033422470093, 1.7156733274459839, 1.8034433126449585, 1.8912131786346436, 1.9789831638336182, 2.0667531490325928, 2.1545231342315674, 2.242293119430542, 2.3300631046295166, 2.417833089828491, 2.505603075027466, 2.5933730602264404, 2.681143045425415, 2.7689127922058105, 2.856682777404785, 2.9444527626037598, 3.0322227478027344]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 27.0, 30.0, 45.0, 55.0, 88.0, 117.0, 166.0, 246.0, 351.0, 487.0, 761.0, 1073.0, 1659.0, 2739.0, 4374.0, 7843.0, 14667.0, 33647.0, 117876.0, 547799.0, 221257.0, 49483.0, 19535.0, 9669.0, 5390.0, 3179.0, 1980.0, 1326.0, 812.0, 548.0, 353.0, 281.0, 181.0, 150.0, 94.0, 66.0, 50.0, 28.0, 31.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.03369140625, -1.0, -0.96630859375, -0.9326171875, -0.89892578125, -0.865234375, -0.83154296875, -0.7978515625, -0.76416015625, -0.73046875, -0.69677734375, -0.6630859375, -0.62939453125, -0.595703125, -0.56201171875, -0.5283203125, -0.49462890625, -0.4609375, -0.42724609375, -0.3935546875, -0.35986328125, -0.326171875, -0.29248046875, -0.2587890625, -0.22509765625, -0.19140625, -0.15771484375, -0.1240234375, -0.09033203125, -0.056640625, -0.02294921875, 0.0107421875, 0.04443359375, 0.078125, 0.11181640625, 0.1455078125, 0.17919921875, 0.212890625, 0.24658203125, 0.2802734375, 0.31396484375, 0.34765625, 0.38134765625, 0.4150390625, 0.44873046875, 0.482421875, 0.51611328125, 0.5498046875, 0.58349609375, 0.6171875, 0.65087890625, 0.6845703125, 0.71826171875, 0.751953125, 0.78564453125, 0.8193359375, 0.85302734375, 0.88671875, 0.92041015625, 0.9541015625, 0.98779296875, 1.021484375, 1.05517578125, 1.0888671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 3.0, 5.0, 4.0, 15.0, 13.0, 13.0, 37.0, 43.0, 68.0, 94.0, 113.0, 126.0, 126.0, 80.0, 65.0, 43.0, 22.0, 22.0, 14.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.1686725616455078, -0.16315078735351562, -0.15762901306152344, -0.15210723876953125, -0.14658546447753906, -0.14106369018554688, -0.1355419158935547, -0.1300201416015625, -0.12449836730957031, -0.11897659301757812, -0.11345481872558594, -0.10793304443359375, -0.10241127014160156, -0.09688949584960938, -0.09136772155761719, -0.085845947265625, -0.08032417297363281, -0.07480239868164062, -0.06928062438964844, -0.06375885009765625, -0.05823707580566406, -0.052715301513671875, -0.04719352722167969, -0.0416717529296875, -0.03614997863769531, -0.030628204345703125, -0.025106430053710938, -0.01958465576171875, -0.014062881469726562, -0.008541107177734375, -0.0030193328857421875, 0.00250244140625, 0.008024215698242188, 0.013545989990234375, 0.019067764282226562, 0.02458953857421875, 0.030111312866210938, 0.035633087158203125, 0.04115486145019531, 0.0466766357421875, 0.05219841003417969, 0.057720184326171875, 0.06324195861816406, 0.06876373291015625, 0.07428550720214844, 0.07980728149414062, 0.08532905578613281, 0.090850830078125, 0.09637260437011719, 0.10189437866210938, 0.10741615295410156, 0.11293792724609375, 0.11845970153808594, 0.12398147583007812, 0.1295032501220703, 0.1350250244140625, 0.1405467987060547, 0.14606857299804688, 0.15159034729003906, 0.15711212158203125, 0.16263389587402344, 0.16815567016601562, 0.1736774444580078, 0.17919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 17.0, 28.0, 92.0, 193.0, 558.0, 1912.0, 8475.0, 48539.0, 393786.0, 518268.0, 62780.0, 10759.0, 2206.0, 599.0, 169.0, 89.0, 25.0, 10.0, 11.0, 8.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.44921875, -2.3910064697265625, -2.332794189453125, -2.2745819091796875, -2.21636962890625, -2.1581573486328125, -2.099945068359375, -2.0417327880859375, -1.9835205078125, -1.9253082275390625, -1.867095947265625, -1.8088836669921875, -1.75067138671875, -1.6924591064453125, -1.634246826171875, -1.5760345458984375, -1.517822265625, -1.4596099853515625, -1.401397705078125, -1.3431854248046875, -1.28497314453125, -1.2267608642578125, -1.168548583984375, -1.1103363037109375, -1.0521240234375, -0.9939117431640625, -0.935699462890625, -0.8774871826171875, -0.81927490234375, -0.7610626220703125, -0.702850341796875, -0.6446380615234375, -0.58642578125, -0.5282135009765625, -0.470001220703125, -0.4117889404296875, -0.35357666015625, -0.2953643798828125, -0.237152099609375, -0.1789398193359375, -0.1207275390625, -0.0625152587890625, -0.004302978515625, 0.0539093017578125, 0.11212158203125, 0.1703338623046875, 0.228546142578125, 0.2867584228515625, 0.344970703125, 0.4031829833984375, 0.461395263671875, 0.5196075439453125, 0.57781982421875, 0.6360321044921875, 0.694244384765625, 0.7524566650390625, 0.8106689453125, 0.8688812255859375, 0.927093505859375, 0.9853057861328125, 1.04351806640625, 1.1017303466796875, 1.159942626953125, 1.2181549072265625, 1.2763671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 4.0, 12.0, 10.0, 13.0, 15.0, 14.0, 25.0, 26.0, 28.0, 23.0, 37.0, 25.0, 43.0, 45.0, 44.0, 43.0, 45.0, 37.0, 32.0, 45.0, 52.0, 47.0, 39.0, 36.0, 39.0, 30.0, 24.0, 29.0, 17.0, 20.0, 18.0, 19.0, 6.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7307281494140625, -0.708526611328125, -0.6863250732421875, -0.66412353515625, -0.6419219970703125, -0.619720458984375, -0.5975189208984375, -0.5753173828125, -0.5531158447265625, -0.530914306640625, -0.5087127685546875, -0.48651123046875, -0.4643096923828125, -0.442108154296875, -0.4199066162109375, -0.397705078125, -0.3755035400390625, -0.353302001953125, -0.3311004638671875, -0.30889892578125, -0.2866973876953125, -0.264495849609375, -0.2422943115234375, -0.2200927734375, -0.1978912353515625, -0.175689697265625, -0.1534881591796875, -0.13128662109375, -0.1090850830078125, -0.086883544921875, -0.0646820068359375, -0.04248046875, -0.0202789306640625, 0.001922607421875, 0.0241241455078125, 0.04632568359375, 0.0685272216796875, 0.090728759765625, 0.1129302978515625, 0.1351318359375, 0.1573333740234375, 0.179534912109375, 0.2017364501953125, 0.22393798828125, 0.2461395263671875, 0.268341064453125, 0.2905426025390625, 0.312744140625, 0.3349456787109375, 0.357147216796875, 0.3793487548828125, 0.40155029296875, 0.4237518310546875, 0.445953369140625, 0.4681549072265625, 0.4903564453125, 0.5125579833984375, 0.534759521484375, 0.5569610595703125, 0.57916259765625, 0.6013641357421875, 0.623565673828125, 0.6457672119140625, 0.66796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 21.0, 94.0, 569.0, 36103.0, 1009069.0, 2391.0, 212.0, 44.0, 17.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8502197265625, -7.598876953125, -7.3475341796875, -7.09619140625, -6.8448486328125, -6.593505859375, -6.3421630859375, -6.0908203125, -5.8394775390625, -5.588134765625, -5.3367919921875, -5.08544921875, -4.8341064453125, -4.582763671875, -4.3314208984375, -4.080078125, -3.8287353515625, -3.577392578125, -3.3260498046875, -3.07470703125, -2.8233642578125, -2.572021484375, -2.3206787109375, -2.0693359375, -1.8179931640625, -1.566650390625, -1.3153076171875, -1.06396484375, -0.8126220703125, -0.561279296875, -0.3099365234375, -0.05859375, 0.1927490234375, 0.444091796875, 0.6954345703125, 0.94677734375, 1.1981201171875, 1.449462890625, 1.7008056640625, 1.9521484375, 2.2034912109375, 2.454833984375, 2.7061767578125, 2.95751953125, 3.2088623046875, 3.460205078125, 3.7115478515625, 3.962890625, 4.2142333984375, 4.465576171875, 4.7169189453125, 4.96826171875, 5.2196044921875, 5.470947265625, 5.7222900390625, 5.9736328125, 6.2249755859375, 6.476318359375, 6.7276611328125, 6.97900390625, 7.2303466796875, 7.481689453125, 7.7330322265625, 7.984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 7.0, 9.0, 9.0, 17.0, 38.0, 49.0, 71.0, 103.0, 134.0, 114.0, 111.0, 98.0, 64.0, 59.0, 38.0, 19.0, 13.0, 12.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010782480239868164, -0.00010478310286998749, -0.00010174140334129333, -9.869970381259918e-05, -9.565800428390503e-05, -9.261630475521088e-05, -8.957460522651672e-05, -8.653290569782257e-05, -8.349120616912842e-05, -8.044950664043427e-05, -7.740780711174011e-05, -7.436610758304596e-05, -7.13244080543518e-05, -6.828270852565765e-05, -6.52410089969635e-05, -6.219930946826935e-05, -5.9157609939575195e-05, -5.611591041088104e-05, -5.307421088218689e-05, -5.003251135349274e-05, -4.6990811824798584e-05, -4.394911229610443e-05, -4.090741276741028e-05, -3.7865713238716125e-05, -3.482401371002197e-05, -3.178231418132782e-05, -2.8740614652633667e-05, -2.5698915123939514e-05, -2.265721559524536e-05, -1.961551606655121e-05, -1.6573816537857056e-05, -1.3532117009162903e-05, -1.049041748046875e-05, -7.448717951774597e-06, -4.407018423080444e-06, -1.3653188943862915e-06, 1.6763806343078613e-06, 4.718080163002014e-06, 7.759779691696167e-06, 1.080147922039032e-05, 1.3843178749084473e-05, 1.6884878277778625e-05, 1.992657780647278e-05, 2.296827733516693e-05, 2.6009976863861084e-05, 2.9051676392555237e-05, 3.209337592124939e-05, 3.513507544994354e-05, 3.8176774978637695e-05, 4.121847450733185e-05, 4.4260174036026e-05, 4.7301873564720154e-05, 5.034357309341431e-05, 5.338527262210846e-05, 5.642697215080261e-05, 5.9468671679496765e-05, 6.251037120819092e-05, 6.555207073688507e-05, 6.859377026557922e-05, 7.163546979427338e-05, 7.467716932296753e-05, 7.771886885166168e-05, 8.076056838035583e-05, 8.380226790904999e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 38.0, 45.0, 62.0, 105.0, 198.0, 353.0, 675.0, 1488.0, 3448.0, 10119.0, 40093.0, 223842.0, 584376.0, 141574.0, 28359.0, 7979.0, 2989.0, 1319.0, 648.0, 313.0, 164.0, 122.0, 83.0, 46.0, 22.0, 14.0, 13.0, 13.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8389816284179688, -0.8083343505859375, -0.7776870727539062, -0.747039794921875, -0.7163925170898438, -0.6857452392578125, -0.6550979614257812, -0.62445068359375, -0.5938034057617188, -0.5631561279296875, -0.5325088500976562, -0.501861572265625, -0.47121429443359375, -0.4405670166015625, -0.40991973876953125, -0.3792724609375, -0.34862518310546875, -0.3179779052734375, -0.28733062744140625, -0.256683349609375, -0.22603607177734375, -0.1953887939453125, -0.16474151611328125, -0.13409423828125, -0.10344696044921875, -0.0727996826171875, -0.04215240478515625, -0.011505126953125, 0.01914215087890625, 0.0497894287109375, 0.08043670654296875, 0.111083984375, 0.14173126220703125, 0.1723785400390625, 0.20302581787109375, 0.233673095703125, 0.26432037353515625, 0.2949676513671875, 0.32561492919921875, 0.35626220703125, 0.38690948486328125, 0.4175567626953125, 0.44820404052734375, 0.478851318359375, 0.5094985961914062, 0.5401458740234375, 0.5707931518554688, 0.6014404296875, 0.6320877075195312, 0.6627349853515625, 0.6933822631835938, 0.724029541015625, 0.7546768188476562, 0.7853240966796875, 0.8159713745117188, 0.84661865234375, 0.8772659301757812, 0.9079132080078125, 0.9385604858398438, 0.969207763671875, 0.9998550415039062, 1.0305023193359375, 1.0611495971679688, 1.091796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 14.0, 10.0, 15.0, 18.0, 37.0, 55.0, 55.0, 57.0, 95.0, 108.0, 114.0, 107.0, 77.0, 66.0, 42.0, 31.0, 28.0, 19.0, 16.0, 12.0, 6.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6923828125, -0.6668853759765625, -0.641387939453125, -0.6158905029296875, -0.59039306640625, -0.5648956298828125, -0.539398193359375, -0.5139007568359375, -0.4884033203125, -0.4629058837890625, -0.437408447265625, -0.4119110107421875, -0.38641357421875, -0.3609161376953125, -0.335418701171875, -0.3099212646484375, -0.284423828125, -0.2589263916015625, -0.233428955078125, -0.2079315185546875, -0.18243408203125, -0.1569366455078125, -0.131439208984375, -0.1059417724609375, -0.0804443359375, -0.0549468994140625, -0.029449462890625, -0.0039520263671875, 0.02154541015625, 0.0470428466796875, 0.072540283203125, 0.0980377197265625, 0.12353515625, 0.1490325927734375, 0.174530029296875, 0.2000274658203125, 0.22552490234375, 0.2510223388671875, 0.276519775390625, 0.3020172119140625, 0.3275146484375, 0.3530120849609375, 0.378509521484375, 0.4040069580078125, 0.42950439453125, 0.4550018310546875, 0.480499267578125, 0.5059967041015625, 0.531494140625, 0.5569915771484375, 0.582489013671875, 0.6079864501953125, 0.63348388671875, 0.6589813232421875, 0.684478759765625, 0.7099761962890625, 0.7354736328125, 0.7609710693359375, 0.786468505859375, 0.8119659423828125, 0.83746337890625, 0.8629608154296875, 0.888458251953125, 0.9139556884765625, 0.939453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 7.0, 7.0, 34.0, 78.0, 232.0, 359.0, 174.0, 63.0, 24.0, 9.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.288938522338867, -12.865629196166992, -12.442319869995117, -12.019010543823242, -11.595702171325684, -11.172392845153809, -10.749083518981934, -10.325774192810059, -9.902464866638184, -9.479155540466309, -9.055846214294434, -8.632537841796875, -8.209228515625, -7.785919189453125, -7.36260986328125, -6.939300537109375, -6.515991687774658, -6.092682361602783, -5.669373512268066, -5.246064186096191, -4.822754859924316, -4.399445533752441, -3.9761366844177246, -3.5528273582458496, -3.1295182704925537, -2.706209182739258, -2.282899856567383, -1.859590768814087, -1.4362815618515015, -1.012972354888916, -0.5896632671356201, -0.16635394096374512, 0.2569551467895508, 0.6802643537521362, 1.1035735607147217, 1.5268826484680176, 1.950191855430603, 2.3735010623931885, 2.7968101501464844, 3.2201194763183594, 3.6434285640716553, 4.066737651824951, 4.490046977996826, 4.913355827331543, 5.336665153503418, 5.759974479675293, 6.183283805847168, 6.606593132019043, 7.02990198135376, 7.453211307525635, 7.876520156860352, 8.299829483032227, 8.723138809204102, 9.146448135375977, 9.569757461547852, 9.993066787719727, 10.416375160217285, 10.83968448638916, 11.262993812561035, 11.686302185058594, 12.109611511230469, 12.532920837402344, 12.956230163574219, 13.379539489746094, 13.802848815917969]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 21.0, 31.0, 48.0, 63.0, 78.0, 99.0, 126.0, 96.0, 89.0, 80.0, 77.0, 43.0, 25.0, 18.0, 17.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.368463516235352, -11.058740615844727, -10.749017715454102, -10.43929386138916, -10.129570960998535, -9.81984806060791, -9.510124206542969, -9.200401306152344, -8.890678405761719, -8.580955505371094, -8.271232604980469, -7.961508750915527, -7.651785850524902, -7.342062950134277, -7.032339572906494, -6.722616195678711, -6.412893295288086, -6.103170394897461, -5.793447017669678, -5.4837236404418945, -5.1740007400512695, -4.8642778396606445, -4.554554462432861, -4.244831085205078, -3.935108184814453, -3.625385046005249, -3.315661907196045, -3.005938768386841, -2.6962156295776367, -2.3864924907684326, -2.0767693519592285, -1.7670462131500244, -1.4573240280151367, -1.1476008892059326, -0.8378777503967285, -0.5281546115875244, -0.2184314727783203, 0.09129166603088379, 0.4010148048400879, 0.710737943649292, 1.020461082458496, 1.3301842212677002, 1.6399073600769043, 1.9496304988861084, 2.2593536376953125, 2.5690767765045166, 2.8787999153137207, 3.188523054122925, 3.498246192932129, 3.807969331741333, 4.117692470550537, 4.42741584777832, 4.737138748168945, 5.04686164855957, 5.3565850257873535, 5.666308403015137, 5.976031303405762, 6.285754203796387, 6.59547758102417, 6.905200958251953, 7.214923858642578, 7.524646759033203, 7.834370136260986, 8.14409351348877, 8.453816413879395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 15.0, 11.0, 26.0, 30.0, 56.0, 59.0, 89.0, 133.0, 226.0, 287.0, 509.0, 854.0, 1990.0, 4732.0, 18400.0, 533718.0, 3598484.0, 24700.0, 5617.0, 2055.0, 945.0, 476.0, 295.0, 190.0, 108.0, 85.0, 51.0, 38.0, 27.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6171875, -6.43377685546875, -6.2503662109375, -6.06695556640625, -5.883544921875, -5.70013427734375, -5.5167236328125, -5.33331298828125, -5.14990234375, -4.96649169921875, -4.7830810546875, -4.59967041015625, -4.416259765625, -4.23284912109375, -4.0494384765625, -3.86602783203125, -3.6826171875, -3.49920654296875, -3.3157958984375, -3.13238525390625, -2.948974609375, -2.76556396484375, -2.5821533203125, -2.39874267578125, -2.21533203125, -2.03192138671875, -1.8485107421875, -1.66510009765625, -1.481689453125, -1.29827880859375, -1.1148681640625, -0.93145751953125, -0.748046875, -0.56463623046875, -0.3812255859375, -0.19781494140625, -0.014404296875, 0.16900634765625, 0.3524169921875, 0.53582763671875, 0.71923828125, 0.90264892578125, 1.0860595703125, 1.26947021484375, 1.452880859375, 1.63629150390625, 1.8197021484375, 2.00311279296875, 2.1865234375, 2.36993408203125, 2.5533447265625, 2.73675537109375, 2.920166015625, 3.10357666015625, 3.2869873046875, 3.47039794921875, 3.65380859375, 3.83721923828125, 4.0206298828125, 4.20404052734375, 4.387451171875, 4.57086181640625, 4.7542724609375, 4.93768310546875, 5.12109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 9.0, 12.0, 18.0, 20.0, 29.0, 59.0, 76.0, 107.0, 118.0, 121.0, 106.0, 102.0, 57.0, 45.0, 18.0, 24.0, 8.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.2125415802001953, -0.20572280883789062, -0.19890403747558594, -0.19208526611328125, -0.18526649475097656, -0.17844772338867188, -0.1716289520263672, -0.1648101806640625, -0.1579914093017578, -0.15117263793945312, -0.14435386657714844, -0.13753509521484375, -0.13071632385253906, -0.12389755249023438, -0.11707878112792969, -0.110260009765625, -0.10344123840332031, -0.09662246704101562, -0.08980369567871094, -0.08298492431640625, -0.07616615295410156, -0.06934738159179688, -0.06252861022949219, -0.0557098388671875, -0.04889106750488281, -0.042072296142578125, -0.03525352478027344, -0.02843475341796875, -0.021615982055664062, -0.014797210693359375, -0.007978439331054688, -0.00115966796875, 0.0056591033935546875, 0.012477874755859375, 0.019296646118164062, 0.02611541748046875, 0.03293418884277344, 0.039752960205078125, 0.04657173156738281, 0.0533905029296875, 0.06020927429199219, 0.06702804565429688, 0.07384681701660156, 0.08066558837890625, 0.08748435974121094, 0.09430313110351562, 0.10112190246582031, 0.107940673828125, 0.11475944519042969, 0.12157821655273438, 0.12839698791503906, 0.13521575927734375, 0.14203453063964844, 0.14885330200195312, 0.1556720733642578, 0.1624908447265625, 0.1693096160888672, 0.17612838745117188, 0.18294715881347656, 0.18976593017578125, 0.19658470153808594, 0.20340347290039062, 0.2102222442626953, 0.217041015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 19.0, 19.0, 31.0, 31.0, 59.0, 78.0, 158.0, 789.0, 333734.0, 3857683.0, 1167.0, 195.0, 89.0, 68.0, 45.0, 33.0, 19.0, 11.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.541015625, -11.97265625, -11.404296875, -10.8359375, -10.267578125, -9.69921875, -9.130859375, -8.5625, -7.994140625, -7.42578125, -6.857421875, -6.2890625, -5.720703125, -5.15234375, -4.583984375, -4.015625, -3.447265625, -2.87890625, -2.310546875, -1.7421875, -1.173828125, -0.60546875, -0.037109375, 0.53125, 1.099609375, 1.66796875, 2.236328125, 2.8046875, 3.373046875, 3.94140625, 4.509765625, 5.078125, 5.646484375, 6.21484375, 6.783203125, 7.3515625, 7.919921875, 8.48828125, 9.056640625, 9.625, 10.193359375, 10.76171875, 11.330078125, 11.8984375, 12.466796875, 13.03515625, 13.603515625, 14.171875, 14.740234375, 15.30859375, 15.876953125, 16.4453125, 17.013671875, 17.58203125, 18.150390625, 18.71875, 19.287109375, 19.85546875, 20.423828125, 20.9921875, 21.560546875, 22.12890625, 22.697265625, 23.265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 18.0, 7.0, 18.0, 24.0, 32.0, 51.0, 83.0, 129.0, 219.0, 441.0, 1678.0, 713.0, 257.0, 124.0, 75.0, 52.0, 42.0, 32.0, 25.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5732421875, -0.5584335327148438, -0.5436248779296875, -0.5288162231445312, -0.514007568359375, -0.49919891357421875, -0.4843902587890625, -0.46958160400390625, -0.45477294921875, -0.43996429443359375, -0.4251556396484375, -0.41034698486328125, -0.395538330078125, -0.38072967529296875, -0.3659210205078125, -0.35111236572265625, -0.3363037109375, -0.32149505615234375, -0.3066864013671875, -0.29187774658203125, -0.277069091796875, -0.26226043701171875, -0.2474517822265625, -0.23264312744140625, -0.21783447265625, -0.20302581787109375, -0.1882171630859375, -0.17340850830078125, -0.158599853515625, -0.14379119873046875, -0.1289825439453125, -0.11417388916015625, -0.099365234375, -0.08455657958984375, -0.0697479248046875, -0.05493927001953125, -0.040130615234375, -0.02532196044921875, -0.0105133056640625, 0.00429534912109375, 0.01910400390625, 0.03391265869140625, 0.0487213134765625, 0.06352996826171875, 0.078338623046875, 0.09314727783203125, 0.1079559326171875, 0.12276458740234375, 0.1375732421875, 0.15238189697265625, 0.1671905517578125, 0.18199920654296875, 0.196807861328125, 0.21161651611328125, 0.2264251708984375, 0.24123382568359375, 0.25604248046875, 0.27085113525390625, 0.2856597900390625, 0.30046844482421875, 0.315277099609375, 0.33008575439453125, 0.3448944091796875, 0.35970306396484375, 0.37451171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 15.0, 22.0, 19.0, 29.0, 62.0, 88.0, 173.0, 159.0, 143.0, 104.0, 68.0, 34.0, 24.0, 12.0, 10.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378148317337036, -2.3036506175994873, -2.2291531562805176, -2.1546554565429688, -2.08015775680542, -2.00566029548645, -1.9311625957489014, -1.856665015220642, -1.7821674346923828, -1.7076698541641235, -1.6331722736358643, -1.5586745738983154, -1.4841769933700562, -1.4096794128417969, -1.335181713104248, -1.2606841325759888, -1.1861865520477295, -1.1116889715194702, -1.037191390991211, -0.9626936912536621, -0.8881961107254028, -0.8136985301971436, -0.7392008900642395, -0.6647032499313354, -0.5902056694030762, -0.5157080888748169, -0.44121044874191284, -0.3667128384113312, -0.2922152280807495, -0.21771761775016785, -0.14322000741958618, -0.06872236728668213, 0.005774974822998047, 0.08027258515357971, 0.15477019548416138, 0.22926780581474304, 0.3037654161453247, 0.37826302647590637, 0.45276063680648804, 0.5272582769393921, 0.6017558574676514, 0.6762534379959106, 0.7507510781288147, 0.8252487182617188, 0.899746298789978, 0.9742438793182373, 1.0487415790557861, 1.1232391595840454, 1.1977367401123047, 1.272234320640564, 1.3467319011688232, 1.421229600906372, 1.4957271814346313, 1.5702247619628906, 1.6447224617004395, 1.7192200422286987, 1.793717622756958, 1.8682152032852173, 1.9427127838134766, 2.0172104835510254, 2.091708183288574, 2.166205644607544, 2.2407033443450928, 2.3152008056640625, 2.3896985054016113]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 12.0, 19.0, 22.0, 18.0, 26.0, 35.0, 41.0, 38.0, 48.0, 57.0, 67.0, 67.0, 52.0, 66.0, 65.0, 55.0, 51.0, 56.0, 47.0, 30.0, 19.0, 22.0, 16.0, 17.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7533705234527588, -1.6853567361831665, -1.6173430681228638, -1.5493292808532715, -1.4813156127929688, -1.4133018255233765, -1.3452880382537842, -1.2772743701934814, -1.2092607021331787, -1.1412469148635864, -1.0732332468032837, -1.0052194595336914, -0.9372057914733887, -0.8691920042037964, -0.8011782765388489, -0.7331645488739014, -0.6651507616043091, -0.5971370339393616, -0.5291233062744141, -0.46110954880714417, -0.39309582114219666, -0.32508209347724915, -0.25706833600997925, -0.18905460834503174, -0.12104088068008423, -0.05302714556455612, 0.014986589550971985, 0.08300033211708069, 0.1510140597820282, 0.2190277874469757, 0.2870415449142456, 0.3550552725791931, 0.4230690002441406, 0.49108272790908813, 0.5590964555740356, 0.6271102428436279, 0.6951239109039307, 0.763137698173523, 0.8311514258384705, 0.899165153503418, 0.9671788811683655, 1.035192608833313, 1.1032063961029053, 1.171220064163208, 1.2392338514328003, 1.307247519493103, 1.3752613067626953, 1.443274974822998, 1.5112887620925903, 1.5793025493621826, 1.6473162174224854, 1.7153300046920776, 1.7833436727523804, 1.8513574600219727, 1.9193711280822754, 1.9873849153518677, 2.05539870262146, 2.1234123706817627, 2.1914262771606445, 2.2594399452209473, 2.32745361328125, 2.3954672813415527, 2.4634811878204346, 2.5314948558807373, 2.59950852394104]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 10.0, 6.0, 10.0, 14.0, 20.0, 30.0, 41.0, 52.0, 82.0, 131.0, 186.0, 320.0, 461.0, 900.0, 1833.0, 4715.0, 16211.0, 99137.0, 705809.0, 183069.0, 24219.0, 6231.0, 2336.0, 1087.0, 611.0, 349.0, 218.0, 142.0, 107.0, 79.0, 41.0, 22.0, 24.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.478515625, -2.404815673828125, -2.33111572265625, -2.257415771484375, -2.1837158203125, -2.110015869140625, -2.03631591796875, -1.962615966796875, -1.888916015625, -1.815216064453125, -1.74151611328125, -1.667816162109375, -1.5941162109375, -1.520416259765625, -1.44671630859375, -1.373016357421875, -1.29931640625, -1.225616455078125, -1.15191650390625, -1.078216552734375, -1.0045166015625, -0.930816650390625, -0.85711669921875, -0.783416748046875, -0.709716796875, -0.636016845703125, -0.56231689453125, -0.488616943359375, -0.4149169921875, -0.341217041015625, -0.26751708984375, -0.193817138671875, -0.1201171875, -0.046417236328125, 0.02728271484375, 0.100982666015625, 0.1746826171875, 0.248382568359375, 0.32208251953125, 0.395782470703125, 0.469482421875, 0.543182373046875, 0.61688232421875, 0.690582275390625, 0.7642822265625, 0.837982177734375, 0.91168212890625, 0.985382080078125, 1.05908203125, 1.132781982421875, 1.20648193359375, 1.280181884765625, 1.3538818359375, 1.427581787109375, 1.50128173828125, 1.574981689453125, 1.648681640625, 1.722381591796875, 1.79608154296875, 1.869781494140625, 1.9434814453125, 2.017181396484375, 2.09088134765625, 2.164581298828125, 2.23828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 7.0, 14.0, 21.0, 35.0, 67.0, 69.0, 99.0, 116.0, 135.0, 114.0, 103.0, 69.0, 50.0, 26.0, 19.0, 18.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210205078125, -0.20248031616210938, -0.19475555419921875, -0.18703079223632812, -0.1793060302734375, -0.17158126831054688, -0.16385650634765625, -0.15613174438476562, -0.148406982421875, -0.14068222045898438, -0.13295745849609375, -0.12523269653320312, -0.1175079345703125, -0.10978317260742188, -0.10205841064453125, -0.09433364868164062, -0.08660888671875, -0.07888412475585938, -0.07115936279296875, -0.06343460083007812, -0.0557098388671875, -0.047985076904296875, -0.04026031494140625, -0.032535552978515625, -0.024810791015625, -0.017086029052734375, -0.00936126708984375, -0.001636505126953125, 0.0060882568359375, 0.013813018798828125, 0.02153778076171875, 0.029262542724609375, 0.0369873046875, 0.044712066650390625, 0.05243682861328125, 0.060161590576171875, 0.0678863525390625, 0.07561111450195312, 0.08333587646484375, 0.09106063842773438, 0.098785400390625, 0.10651016235351562, 0.11423492431640625, 0.12195968627929688, 0.1296844482421875, 0.13740921020507812, 0.14513397216796875, 0.15285873413085938, 0.16058349609375, 0.16830825805664062, 0.17603302001953125, 0.18375778198242188, 0.1914825439453125, 0.19920730590820312, 0.20693206787109375, 0.21465682983398438, 0.222381591796875, 0.23010635375976562, 0.23783111572265625, 0.24555587768554688, 0.2532806396484375, 0.2610054016113281, 0.26873016357421875, 0.2764549255371094, 0.2841796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 27.0, 37.0, 54.0, 90.0, 110.0, 179.0, 247.0, 421.0, 605.0, 1013.0, 1685.0, 2929.0, 5146.0, 9695.0, 18800.0, 38538.0, 87884.0, 233314.0, 356271.0, 164350.0, 64836.0, 29671.0, 14534.0, 7522.0, 4219.0, 2426.0, 1386.0, 909.0, 567.0, 329.0, 205.0, 158.0, 105.0, 75.0, 51.0, 31.0, 23.0, 17.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.0375823974609375, -1.000946044921875, -0.9643096923828125, -0.92767333984375, -0.8910369873046875, -0.854400634765625, -0.8177642822265625, -0.7811279296875, -0.7444915771484375, -0.707855224609375, -0.6712188720703125, -0.63458251953125, -0.5979461669921875, -0.561309814453125, -0.5246734619140625, -0.488037109375, -0.4514007568359375, -0.414764404296875, -0.3781280517578125, -0.34149169921875, -0.3048553466796875, -0.268218994140625, -0.2315826416015625, -0.1949462890625, -0.1583099365234375, -0.121673583984375, -0.0850372314453125, -0.04840087890625, -0.0117645263671875, 0.024871826171875, 0.0615081787109375, 0.09814453125, 0.1347808837890625, 0.171417236328125, 0.2080535888671875, 0.24468994140625, 0.2813262939453125, 0.317962646484375, 0.3545989990234375, 0.3912353515625, 0.4278717041015625, 0.464508056640625, 0.5011444091796875, 0.53778076171875, 0.5744171142578125, 0.611053466796875, 0.6476898193359375, 0.684326171875, 0.7209625244140625, 0.757598876953125, 0.7942352294921875, 0.83087158203125, 0.8675079345703125, 0.904144287109375, 0.9407806396484375, 0.9774169921875, 1.0140533447265625, 1.050689697265625, 1.0873260498046875, 1.12396240234375, 1.1605987548828125, 1.197235107421875, 1.2338714599609375, 1.2705078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 8.0, 7.0, 8.0, 5.0, 17.0, 21.0, 22.0, 18.0, 24.0, 21.0, 37.0, 41.0, 25.0, 46.0, 46.0, 33.0, 41.0, 55.0, 60.0, 37.0, 53.0, 34.0, 35.0, 39.0, 32.0, 25.0, 28.0, 35.0, 29.0, 24.0, 14.0, 12.0, 16.0, 4.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92138671875, -0.8895187377929688, -0.8576507568359375, -0.8257827758789062, -0.793914794921875, -0.7620468139648438, -0.7301788330078125, -0.6983108520507812, -0.66644287109375, -0.6345748901367188, -0.6027069091796875, -0.5708389282226562, -0.538970947265625, -0.5071029663085938, -0.4752349853515625, -0.44336700439453125, -0.4114990234375, -0.37963104248046875, -0.3477630615234375, -0.31589508056640625, -0.284027099609375, -0.25215911865234375, -0.2202911376953125, -0.18842315673828125, -0.15655517578125, -0.12468719482421875, -0.0928192138671875, -0.06095123291015625, -0.029083251953125, 0.00278472900390625, 0.0346527099609375, 0.06652069091796875, 0.098388671875, 0.13025665283203125, 0.1621246337890625, 0.19399261474609375, 0.225860595703125, 0.25772857666015625, 0.2895965576171875, 0.32146453857421875, 0.35333251953125, 0.38520050048828125, 0.4170684814453125, 0.44893646240234375, 0.480804443359375, 0.5126724243164062, 0.5445404052734375, 0.5764083862304688, 0.6082763671875, 0.6401443481445312, 0.6720123291015625, 0.7038803100585938, 0.735748291015625, 0.7676162719726562, 0.7994842529296875, 0.8313522338867188, 0.86322021484375, 0.8950881958007812, 0.9269561767578125, 0.9588241577148438, 0.990692138671875, 1.0225601196289062, 1.0544281005859375, 1.0862960815429688, 1.1181640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 6.0, 12.0, 13.0, 31.0, 36.0, 52.0, 67.0, 125.0, 199.0, 372.0, 735.0, 1617.0, 4382.0, 16346.0, 108219.0, 674712.0, 206463.0, 25172.0, 5849.0, 2118.0, 894.0, 437.0, 253.0, 148.0, 89.0, 63.0, 31.0, 32.0, 14.0, 18.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.459716796875, -1.41357421875, -1.367431640625, -1.3212890625, -1.275146484375, -1.22900390625, -1.182861328125, -1.13671875, -1.090576171875, -1.04443359375, -0.998291015625, -0.9521484375, -0.906005859375, -0.85986328125, -0.813720703125, -0.767578125, -0.721435546875, -0.67529296875, -0.629150390625, -0.5830078125, -0.536865234375, -0.49072265625, -0.444580078125, -0.3984375, -0.352294921875, -0.30615234375, -0.260009765625, -0.2138671875, -0.167724609375, -0.12158203125, -0.075439453125, -0.029296875, 0.016845703125, 0.06298828125, 0.109130859375, 0.1552734375, 0.201416015625, 0.24755859375, 0.293701171875, 0.33984375, 0.385986328125, 0.43212890625, 0.478271484375, 0.5244140625, 0.570556640625, 0.61669921875, 0.662841796875, 0.708984375, 0.755126953125, 0.80126953125, 0.847412109375, 0.8935546875, 0.939697265625, 0.98583984375, 1.031982421875, 1.078125, 1.124267578125, 1.17041015625, 1.216552734375, 1.2626953125, 1.308837890625, 1.35498046875, 1.401123046875, 1.447265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 12.0, 24.0, 19.0, 34.0, 43.0, 51.0, 64.0, 67.0, 100.0, 110.0, 93.0, 71.0, 59.0, 46.0, 36.0, 31.0, 30.0, 20.0, 17.0, 15.0, 5.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013208389282226562, -0.00012873392552137375, -0.00012538395822048187, -0.00012203399091959, -0.00011868402361869812, -0.00011533405631780624, -0.00011198408901691437, -0.00010863412171602249, -0.00010528415441513062, -0.00010193418711423874, -9.858421981334686e-05, -9.523425251245499e-05, -9.188428521156311e-05, -8.853431791067123e-05, -8.518435060977936e-05, -8.183438330888748e-05, -7.84844160079956e-05, -7.513444870710373e-05, -7.178448140621185e-05, -6.843451410531998e-05, -6.50845468044281e-05, -6.173457950353622e-05, -5.838461220264435e-05, -5.503464490175247e-05, -5.1684677600860596e-05, -4.833471029996872e-05, -4.498474299907684e-05, -4.163477569818497e-05, -3.828480839729309e-05, -3.4934841096401215e-05, -3.158487379550934e-05, -2.8234906494617462e-05, -2.4884939193725586e-05, -2.153497189283371e-05, -1.8185004591941833e-05, -1.4835037291049957e-05, -1.1485069990158081e-05, -8.135102689266205e-06, -4.785135388374329e-06, -1.4351680874824524e-06, 1.914799213409424e-06, 5.2647665143013e-06, 8.614733815193176e-06, 1.1964701116085052e-05, 1.531466841697693e-05, 1.8664635717868805e-05, 2.201460301876068e-05, 2.5364570319652557e-05, 2.8714537620544434e-05, 3.206450492143631e-05, 3.5414472222328186e-05, 3.876443952322006e-05, 4.211440682411194e-05, 4.5464374125003815e-05, 4.881434142589569e-05, 5.216430872678757e-05, 5.551427602767944e-05, 5.886424332857132e-05, 6.22142106294632e-05, 6.556417793035507e-05, 6.891414523124695e-05, 7.226411253213882e-05, 7.56140798330307e-05, 7.896404713392258e-05, 8.231401443481445e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 10.0, 14.0, 24.0, 28.0, 63.0, 98.0, 195.0, 362.0, 912.0, 2739.0, 12808.0, 245221.0, 748810.0, 30382.0, 4399.0, 1324.0, 527.0, 268.0, 132.0, 96.0, 34.0, 26.0, 19.0, 18.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.504241943359375, -2.42645263671875, -2.348663330078125, -2.2708740234375, -2.193084716796875, -2.11529541015625, -2.037506103515625, -1.959716796875, -1.881927490234375, -1.80413818359375, -1.726348876953125, -1.6485595703125, -1.570770263671875, -1.49298095703125, -1.415191650390625, -1.33740234375, -1.259613037109375, -1.18182373046875, -1.104034423828125, -1.0262451171875, -0.948455810546875, -0.87066650390625, -0.792877197265625, -0.715087890625, -0.637298583984375, -0.55950927734375, -0.481719970703125, -0.4039306640625, -0.326141357421875, -0.24835205078125, -0.170562744140625, -0.0927734375, -0.014984130859375, 0.06280517578125, 0.140594482421875, 0.2183837890625, 0.296173095703125, 0.37396240234375, 0.451751708984375, 0.529541015625, 0.607330322265625, 0.68511962890625, 0.762908935546875, 0.8406982421875, 0.918487548828125, 0.99627685546875, 1.074066162109375, 1.15185546875, 1.229644775390625, 1.30743408203125, 1.385223388671875, 1.4630126953125, 1.540802001953125, 1.61859130859375, 1.696380615234375, 1.774169921875, 1.851959228515625, 1.92974853515625, 2.007537841796875, 2.0853271484375, 2.163116455078125, 2.24090576171875, 2.318695068359375, 2.396484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 12.0, 27.0, 42.0, 49.0, 82.0, 102.0, 144.0, 141.0, 138.0, 76.0, 76.0, 44.0, 24.0, 13.0, 5.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6004791259765625, -0.569122314453125, -0.5377655029296875, -0.50640869140625, -0.4750518798828125, -0.443695068359375, -0.4123382568359375, -0.3809814453125, -0.3496246337890625, -0.318267822265625, -0.2869110107421875, -0.25555419921875, -0.2241973876953125, -0.192840576171875, -0.1614837646484375, -0.130126953125, -0.0987701416015625, -0.067413330078125, -0.0360565185546875, -0.00469970703125, 0.0266571044921875, 0.058013916015625, 0.0893707275390625, 0.1207275390625, 0.1520843505859375, 0.183441162109375, 0.2147979736328125, 0.24615478515625, 0.2775115966796875, 0.308868408203125, 0.3402252197265625, 0.37158203125, 0.4029388427734375, 0.434295654296875, 0.4656524658203125, 0.49700927734375, 0.5283660888671875, 0.559722900390625, 0.5910797119140625, 0.6224365234375, 0.6537933349609375, 0.685150146484375, 0.7165069580078125, 0.74786376953125, 0.7792205810546875, 0.810577392578125, 0.8419342041015625, 0.873291015625, 0.9046478271484375, 0.936004638671875, 0.9673614501953125, 0.99871826171875, 1.0300750732421875, 1.061431884765625, 1.0927886962890625, 1.1241455078125, 1.1555023193359375, 1.186859130859375, 1.2182159423828125, 1.24957275390625, 1.2809295654296875, 1.312286376953125, 1.3436431884765625, 1.375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 14.0, 25.0, 53.0, 83.0, 138.0, 201.0, 191.0, 122.0, 57.0, 30.0, 21.0, 13.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.404948234558105, -10.979870796203613, -10.554794311523438, -10.129716873168945, -9.704639434814453, -9.279562950134277, -8.854485511779785, -8.42940902709961, -8.004331588745117, -7.579254627227783, -7.154177665710449, -6.729100227355957, -6.304023265838623, -5.878946304321289, -5.453868865966797, -5.028791904449463, -4.603714942932129, -4.178637981414795, -3.753560781478882, -3.3284835815429688, -2.9034066200256348, -2.478329658508301, -2.0532524585723877, -1.6281752586364746, -1.2030982971191406, -0.7780212163925171, -0.35294413566589355, 0.07213294506072998, 0.4972100257873535, 0.9222869873046875, 1.3473641872406006, 1.7724413871765137, 2.197519302368164, 2.622596263885498, 3.047673463821411, 3.472750663757324, 3.897827625274658, 4.322904586791992, 4.747982025146484, 5.173058986663818, 5.598135948181152, 6.023212909698486, 6.44828987121582, 6.8733673095703125, 7.2984442710876465, 7.7235212326049805, 8.148598670959473, 8.573675155639648, 8.99875259399414, 9.423830032348633, 9.848906517028809, 10.2739839553833, 10.699060440063477, 11.124137878417969, 11.549215316772461, 11.974292755126953, 12.399369239807129, 12.824446678161621, 13.249523162841797, 13.674600601196289, 14.099678039550781, 14.524754524230957, 14.94983196258545, 15.374908447265625, 15.799985885620117]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 15.0, 15.0, 25.0, 40.0, 37.0, 45.0, 85.0, 65.0, 84.0, 83.0, 81.0, 90.0, 82.0, 61.0, 43.0, 40.0, 19.0, 19.0, 14.0, 16.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.438114166259766, -13.978090286254883, -13.518067359924316, -13.058043479919434, -12.598020553588867, -12.137996673583984, -11.677972793579102, -11.217948913574219, -10.757925987243652, -10.29790210723877, -9.837879180908203, -9.37785530090332, -8.917831420898438, -8.457808494567871, -7.997784614562988, -7.537761211395264, -7.077737808227539, -6.6177144050598145, -6.15769100189209, -5.697667121887207, -5.237643718719482, -4.777620315551758, -4.317596435546875, -3.8575730323791504, -3.397549629211426, -2.937526226043701, -2.4775025844573975, -2.0174789428710938, -1.5574555397033691, -1.0974321365356445, -0.6374084949493408, -0.1773848533630371, 0.2826385498046875, 0.7426620721817017, 1.2026855945587158, 1.66270911693573, 2.122732639312744, 2.5827560424804688, 3.0427796840667725, 3.502803325653076, 3.962826728820801, 4.422850131988525, 4.88287353515625, 5.342897415161133, 5.802920818328857, 6.262944221496582, 6.722968101501465, 7.1829915046691895, 7.643014907836914, 8.103038787841797, 8.563061714172363, 9.023085594177246, 9.483108520507812, 9.943132400512695, 10.403156280517578, 10.863180160522461, 11.323203086853027, 11.78322696685791, 12.243249893188477, 12.70327377319336, 13.163297653198242, 13.623320579528809, 14.083344459533691, 14.543367385864258, 15.00339126586914]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 5.0, 16.0, 22.0, 39.0, 96.0, 187.0, 373.0, 1015.0, 4843.0, 242356.0, 3936734.0, 6964.0, 1058.0, 333.0, 124.0, 50.0, 27.0, 14.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.786865234375, -21.18310546875, -20.579345703125, -19.9755859375, -19.371826171875, -18.76806640625, -18.164306640625, -17.560546875, -16.956787109375, -16.35302734375, -15.749267578125, -15.1455078125, -14.541748046875, -13.93798828125, -13.334228515625, -12.73046875, -12.126708984375, -11.52294921875, -10.919189453125, -10.3154296875, -9.711669921875, -9.10791015625, -8.504150390625, -7.900390625, -7.296630859375, -6.69287109375, -6.089111328125, -5.4853515625, -4.881591796875, -4.27783203125, -3.674072265625, -3.0703125, -2.466552734375, -1.86279296875, -1.259033203125, -0.6552734375, -0.051513671875, 0.55224609375, 1.156005859375, 1.759765625, 2.363525390625, 2.96728515625, 3.571044921875, 4.1748046875, 4.778564453125, 5.38232421875, 5.986083984375, 6.58984375, 7.193603515625, 7.79736328125, 8.401123046875, 9.0048828125, 9.608642578125, 10.21240234375, 10.816162109375, 11.419921875, 12.023681640625, 12.62744140625, 13.231201171875, 13.8349609375, 14.438720703125, 15.04248046875, 15.646240234375, 16.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 19.0, 30.0, 31.0, 70.0, 92.0, 117.0, 142.0, 130.0, 118.0, 87.0, 46.0, 39.0, 22.0, 12.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5353240966796875, -0.520355224609375, -0.5053863525390625, -0.49041748046875, -0.4754486083984375, -0.460479736328125, -0.4455108642578125, -0.4305419921875, -0.4155731201171875, -0.400604248046875, -0.3856353759765625, -0.37066650390625, -0.3556976318359375, -0.340728759765625, -0.3257598876953125, -0.310791015625, -0.2958221435546875, -0.280853271484375, -0.2658843994140625, -0.25091552734375, -0.2359466552734375, -0.220977783203125, -0.2060089111328125, -0.1910400390625, -0.1760711669921875, -0.161102294921875, -0.1461334228515625, -0.13116455078125, -0.1161956787109375, -0.101226806640625, -0.0862579345703125, -0.0712890625, -0.0563201904296875, -0.041351318359375, -0.0263824462890625, -0.01141357421875, 0.0035552978515625, 0.018524169921875, 0.0334930419921875, 0.0484619140625, 0.0634307861328125, 0.078399658203125, 0.0933685302734375, 0.10833740234375, 0.1233062744140625, 0.138275146484375, 0.1532440185546875, 0.168212890625, 0.1831817626953125, 0.198150634765625, 0.2131195068359375, 0.22808837890625, 0.2430572509765625, 0.258026123046875, 0.2729949951171875, 0.2879638671875, 0.3029327392578125, 0.317901611328125, 0.3328704833984375, 0.34783935546875, 0.3628082275390625, 0.377777099609375, 0.3927459716796875, 0.40771484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 12.0, 12.0, 35.0, 46.0, 56.0, 126.0, 232.0, 657.0, 2711.0, 23682.0, 3856970.0, 297438.0, 9935.0, 1478.0, 403.0, 176.0, 112.0, 56.0, 43.0, 31.0, 34.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.42578125, -5.17718505859375, -4.9285888671875, -4.67999267578125, -4.431396484375, -4.18280029296875, -3.9342041015625, -3.68560791015625, -3.43701171875, -3.18841552734375, -2.9398193359375, -2.69122314453125, -2.442626953125, -2.19403076171875, -1.9454345703125, -1.69683837890625, -1.4482421875, -1.19964599609375, -0.9510498046875, -0.70245361328125, -0.453857421875, -0.20526123046875, 0.0433349609375, 0.29193115234375, 0.54052734375, 0.78912353515625, 1.0377197265625, 1.28631591796875, 1.534912109375, 1.78350830078125, 2.0321044921875, 2.28070068359375, 2.529296875, 2.77789306640625, 3.0264892578125, 3.27508544921875, 3.523681640625, 3.77227783203125, 4.0208740234375, 4.26947021484375, 4.51806640625, 4.76666259765625, 5.0152587890625, 5.26385498046875, 5.512451171875, 5.76104736328125, 6.0096435546875, 6.25823974609375, 6.5068359375, 6.75543212890625, 7.0040283203125, 7.25262451171875, 7.501220703125, 7.74981689453125, 7.9984130859375, 8.24700927734375, 8.49560546875, 8.74420166015625, 8.9927978515625, 9.24139404296875, 9.489990234375, 9.73858642578125, 9.9871826171875, 10.23577880859375, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 9.0, 9.0, 19.0, 28.0, 36.0, 62.0, 68.0, 147.0, 348.0, 1751.0, 915.0, 263.0, 132.0, 76.0, 42.0, 41.0, 25.0, 21.0, 17.0, 10.0, 5.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6959381103515625, -0.674102783203125, -0.6522674560546875, -0.63043212890625, -0.6085968017578125, -0.586761474609375, -0.5649261474609375, -0.5430908203125, -0.5212554931640625, -0.499420166015625, -0.4775848388671875, -0.45574951171875, -0.4339141845703125, -0.412078857421875, -0.3902435302734375, -0.368408203125, -0.3465728759765625, -0.324737548828125, -0.3029022216796875, -0.28106689453125, -0.2592315673828125, -0.237396240234375, -0.2155609130859375, -0.1937255859375, -0.1718902587890625, -0.150054931640625, -0.1282196044921875, -0.10638427734375, -0.0845489501953125, -0.062713623046875, -0.0408782958984375, -0.01904296875, 0.0027923583984375, 0.024627685546875, 0.0464630126953125, 0.06829833984375, 0.0901336669921875, 0.111968994140625, 0.1338043212890625, 0.1556396484375, 0.1774749755859375, 0.199310302734375, 0.2211456298828125, 0.24298095703125, 0.2648162841796875, 0.286651611328125, 0.3084869384765625, 0.330322265625, 0.3521575927734375, 0.373992919921875, 0.3958282470703125, 0.41766357421875, 0.4394989013671875, 0.461334228515625, 0.4831695556640625, 0.5050048828125, 0.5268402099609375, 0.548675537109375, 0.5705108642578125, 0.59234619140625, 0.6141815185546875, 0.636016845703125, 0.6578521728515625, 0.6796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 16.0, 98.0, 535.0, 302.0, 44.0, 12.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.450634002685547, -20.897205352783203, -20.34377670288086, -19.790348052978516, -19.236919403076172, -18.683490753173828, -18.130062103271484, -17.57663345336914, -17.023204803466797, -16.469776153564453, -15.91634750366211, -15.362918853759766, -14.809490203857422, -14.256061553955078, -13.702632904052734, -13.14920425415039, -12.59577465057373, -12.042346000671387, -11.488917350769043, -10.9354887008667, -10.382060050964355, -9.828631401062012, -9.275201797485352, -8.721773147583008, -8.168344497680664, -7.61491584777832, -7.061487197875977, -6.508058547973633, -5.954629898071289, -5.401201248168945, -4.847772121429443, -4.2943434715271, -3.740915298461914, -3.1874866485595703, -2.6340579986572266, -2.0806291103363037, -1.52720046043396, -0.9737718105316162, -0.42034292221069336, 0.1330857276916504, 0.6865143775939941, 1.239943027496338, 1.7933717966079712, 2.3468005657196045, 2.9002292156219482, 3.453657865524292, 4.007086753845215, 4.560515403747559, 5.113944053649902, 5.667372703552246, 6.22080135345459, 6.774230003356934, 7.327658653259277, 7.881087303161621, 8.434516906738281, 8.987945556640625, 9.541374206542969, 10.094802856445312, 10.648231506347656, 11.20166015625, 11.755088806152344, 12.308517456054688, 12.861946105957031, 13.415374755859375, 13.968803405761719]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 11.0, 14.0, 18.0, 20.0, 28.0, 34.0, 47.0, 55.0, 54.0, 61.0, 71.0, 62.0, 60.0, 71.0, 66.0, 54.0, 50.0, 55.0, 39.0, 24.0, 26.0, 24.0, 20.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.167453289031982, -4.066217422485352, -3.9649815559387207, -3.86374568939209, -3.76250958442688, -3.661273717880249, -3.560037851333618, -3.4588019847869873, -3.3575661182403564, -3.2563302516937256, -3.1550943851470947, -3.0538582801818848, -2.952622413635254, -2.851386547088623, -2.750150680541992, -2.6489148139953613, -2.5476789474487305, -2.4464430809020996, -2.3452072143554688, -2.243971347808838, -2.142735242843628, -2.041499376296997, -1.9402635097503662, -1.8390276432037354, -1.7377915382385254, -1.6365556716918945, -1.5353196859359741, -1.4340838193893433, -1.3328479528427124, -1.231611967086792, -1.1303761005401611, -1.0291402339935303, -0.9279043674468994, -0.8266684412956238, -0.7254325747489929, -0.6241966485977173, -0.5229607820510864, -0.4217248558998108, -0.32048892974853516, -0.2192530632019043, -0.11801713705062866, -0.016781233251094818, 0.08445467054843903, 0.18569058179855347, 0.2869264781475067, 0.38816237449645996, 0.4893983006477356, 0.5906341671943665, 0.6918700933456421, 0.7931060194969177, 0.8943418860435486, 0.9955778121948242, 1.096813678741455, 1.198049545288086, 1.2992855310440063, 1.4005213975906372, 1.5017573833465576, 1.6029932498931885, 1.7042292356491089, 1.8054651021957397, 1.9067009687423706, 2.007936954498291, 2.109172821044922, 2.2104086875915527, 2.3116445541381836]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 10.0, 8.0, 8.0, 7.0, 12.0, 22.0, 37.0, 34.0, 45.0, 55.0, 73.0, 101.0, 153.0, 206.0, 309.0, 478.0, 747.0, 1253.0, 2759.0, 7521.0, 32104.0, 267888.0, 631366.0, 80394.0, 13965.0, 4194.0, 1904.0, 942.0, 606.0, 363.0, 259.0, 192.0, 135.0, 97.0, 81.0, 49.0, 34.0, 29.0, 31.0, 22.0, 16.0, 5.0, 12.0, 6.0, 1.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.769134521484375, -2.67108154296875, -2.573028564453125, -2.4749755859375, -2.376922607421875, -2.27886962890625, -2.180816650390625, -2.082763671875, -1.984710693359375, -1.88665771484375, -1.788604736328125, -1.6905517578125, -1.592498779296875, -1.49444580078125, -1.396392822265625, -1.29833984375, -1.200286865234375, -1.10223388671875, -1.004180908203125, -0.9061279296875, -0.808074951171875, -0.71002197265625, -0.611968994140625, -0.513916015625, -0.415863037109375, -0.31781005859375, -0.219757080078125, -0.1217041015625, -0.023651123046875, 0.07440185546875, 0.172454833984375, 0.2705078125, 0.368560791015625, 0.46661376953125, 0.564666748046875, 0.6627197265625, 0.760772705078125, 0.85882568359375, 0.956878662109375, 1.054931640625, 1.152984619140625, 1.25103759765625, 1.349090576171875, 1.4471435546875, 1.545196533203125, 1.64324951171875, 1.741302490234375, 1.83935546875, 1.937408447265625, 2.03546142578125, 2.133514404296875, 2.2315673828125, 2.329620361328125, 2.42767333984375, 2.525726318359375, 2.623779296875, 2.721832275390625, 2.81988525390625, 2.917938232421875, 3.0159912109375, 3.114044189453125, 3.21209716796875, 3.310150146484375, 3.408203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 15.0, 28.0, 72.0, 87.0, 117.0, 158.0, 172.0, 130.0, 95.0, 49.0, 37.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5757675170898438, -0.5577850341796875, -0.5398025512695312, -0.521820068359375, -0.5038375854492188, -0.4858551025390625, -0.46787261962890625, -0.44989013671875, -0.43190765380859375, -0.4139251708984375, -0.39594268798828125, -0.377960205078125, -0.35997772216796875, -0.3419952392578125, -0.32401275634765625, -0.3060302734375, -0.28804779052734375, -0.2700653076171875, -0.25208282470703125, -0.234100341796875, -0.21611785888671875, -0.1981353759765625, -0.18015289306640625, -0.16217041015625, -0.14418792724609375, -0.1262054443359375, -0.10822296142578125, -0.090240478515625, -0.07225799560546875, -0.0542755126953125, -0.03629302978515625, -0.018310546875, -0.00032806396484375, 0.0176544189453125, 0.03563690185546875, 0.053619384765625, 0.07160186767578125, 0.0895843505859375, 0.10756683349609375, 0.12554931640625, 0.14353179931640625, 0.1615142822265625, 0.17949676513671875, 0.197479248046875, 0.21546173095703125, 0.2334442138671875, 0.25142669677734375, 0.2694091796875, 0.28739166259765625, 0.3053741455078125, 0.32335662841796875, 0.341339111328125, 0.35932159423828125, 0.3773040771484375, 0.39528656005859375, 0.41326904296875, 0.43125152587890625, 0.4492340087890625, 0.46721649169921875, 0.485198974609375, 0.5031814575195312, 0.5211639404296875, 0.5391464233398438, 0.55712890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 10.0, 16.0, 27.0, 33.0, 44.0, 66.0, 108.0, 157.0, 265.0, 475.0, 851.0, 1645.0, 3416.0, 8335.0, 27350.0, 140322.0, 625875.0, 187232.0, 34374.0, 9788.0, 3887.0, 1889.0, 943.0, 552.0, 301.0, 215.0, 107.0, 72.0, 47.0, 30.0, 13.0, 14.0, 14.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -1.991455078125, -1.91650390625, -1.841552734375, -1.7666015625, -1.691650390625, -1.61669921875, -1.541748046875, -1.466796875, -1.391845703125, -1.31689453125, -1.241943359375, -1.1669921875, -1.092041015625, -1.01708984375, -0.942138671875, -0.8671875, -0.792236328125, -0.71728515625, -0.642333984375, -0.5673828125, -0.492431640625, -0.41748046875, -0.342529296875, -0.267578125, -0.192626953125, -0.11767578125, -0.042724609375, 0.0322265625, 0.107177734375, 0.18212890625, 0.257080078125, 0.33203125, 0.406982421875, 0.48193359375, 0.556884765625, 0.6318359375, 0.706787109375, 0.78173828125, 0.856689453125, 0.931640625, 1.006591796875, 1.08154296875, 1.156494140625, 1.2314453125, 1.306396484375, 1.38134765625, 1.456298828125, 1.53125, 1.606201171875, 1.68115234375, 1.756103515625, 1.8310546875, 1.906005859375, 1.98095703125, 2.055908203125, 2.130859375, 2.205810546875, 2.28076171875, 2.355712890625, 2.4306640625, 2.505615234375, 2.58056640625, 2.655517578125, 2.73046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 23.0, 22.0, 29.0, 37.0, 62.0, 58.0, 77.0, 63.0, 93.0, 76.0, 89.0, 77.0, 57.0, 51.0, 41.0, 22.0, 25.0, 19.0, 21.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7398681640625, -1.677001953125, -1.6141357421875, -1.55126953125, -1.4884033203125, -1.425537109375, -1.3626708984375, -1.2998046875, -1.2369384765625, -1.174072265625, -1.1112060546875, -1.04833984375, -0.9854736328125, -0.922607421875, -0.8597412109375, -0.796875, -0.7340087890625, -0.671142578125, -0.6082763671875, -0.54541015625, -0.4825439453125, -0.419677734375, -0.3568115234375, -0.2939453125, -0.2310791015625, -0.168212890625, -0.1053466796875, -0.04248046875, 0.0203857421875, 0.083251953125, 0.1461181640625, 0.208984375, 0.2718505859375, 0.334716796875, 0.3975830078125, 0.46044921875, 0.5233154296875, 0.586181640625, 0.6490478515625, 0.7119140625, 0.7747802734375, 0.837646484375, 0.9005126953125, 0.96337890625, 1.0262451171875, 1.089111328125, 1.1519775390625, 1.21484375, 1.2777099609375, 1.340576171875, 1.4034423828125, 1.46630859375, 1.5291748046875, 1.592041015625, 1.6549072265625, 1.7177734375, 1.7806396484375, 1.843505859375, 1.9063720703125, 1.96923828125, 2.0321044921875, 2.094970703125, 2.1578369140625, 2.220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 11.0, 8.0, 21.0, 39.0, 53.0, 104.0, 224.0, 580.0, 2558.0, 44667.0, 986779.0, 11330.0, 1345.0, 429.0, 201.0, 95.0, 37.0, 33.0, 9.0, 13.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3590087890625, -6.178955078125, -5.9989013671875, -5.81884765625, -5.6387939453125, -5.458740234375, -5.2786865234375, -5.0986328125, -4.9185791015625, -4.738525390625, -4.5584716796875, -4.37841796875, -4.1983642578125, -4.018310546875, -3.8382568359375, -3.658203125, -3.4781494140625, -3.298095703125, -3.1180419921875, -2.93798828125, -2.7579345703125, -2.577880859375, -2.3978271484375, -2.2177734375, -2.0377197265625, -1.857666015625, -1.6776123046875, -1.49755859375, -1.3175048828125, -1.137451171875, -0.9573974609375, -0.77734375, -0.5972900390625, -0.417236328125, -0.2371826171875, -0.05712890625, 0.1229248046875, 0.302978515625, 0.4830322265625, 0.6630859375, 0.8431396484375, 1.023193359375, 1.2032470703125, 1.38330078125, 1.5633544921875, 1.743408203125, 1.9234619140625, 2.103515625, 2.2835693359375, 2.463623046875, 2.6436767578125, 2.82373046875, 3.0037841796875, 3.183837890625, 3.3638916015625, 3.5439453125, 3.7239990234375, 3.904052734375, 4.0841064453125, 4.26416015625, 4.4442138671875, 4.624267578125, 4.8043212890625, 4.984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 11.0, 9.0, 14.0, 26.0, 41.0, 40.0, 87.0, 125.0, 192.0, 167.0, 104.0, 73.0, 45.0, 10.0, 10.0, 13.0, 10.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024008750915527344, -0.0002327561378479004, -0.00022542476654052734, -0.0002180933952331543, -0.00021076202392578125, -0.0002034306526184082, -0.00019609928131103516, -0.0001887679100036621, -0.00018143653869628906, -0.00017410516738891602, -0.00016677379608154297, -0.00015944242477416992, -0.00015211105346679688, -0.00014477968215942383, -0.00013744831085205078, -0.00013011693954467773, -0.0001227855682373047, -0.00011545419692993164, -0.0001081228256225586, -0.00010079145431518555, -9.34600830078125e-05, -8.612871170043945e-05, -7.87973403930664e-05, -7.146596908569336e-05, -6.413459777832031e-05, -5.6803226470947266e-05, -4.947185516357422e-05, -4.214048385620117e-05, -3.4809112548828125e-05, -2.7477741241455078e-05, -2.014636993408203e-05, -1.2814998626708984e-05, -5.4836273193359375e-06, 1.8477439880371094e-06, 9.179115295410156e-06, 1.6510486602783203e-05, 2.384185791015625e-05, 3.11732292175293e-05, 3.8504600524902344e-05, 4.583597183227539e-05, 5.316734313964844e-05, 6.0498714447021484e-05, 6.783008575439453e-05, 7.516145706176758e-05, 8.249282836914062e-05, 8.982419967651367e-05, 9.715557098388672e-05, 0.00010448694229125977, 0.00011181831359863281, 0.00011914968490600586, 0.0001264810562133789, 0.00013381242752075195, 0.000141143798828125, 0.00014847517013549805, 0.0001558065414428711, 0.00016313791275024414, 0.0001704692840576172, 0.00017780065536499023, 0.00018513202667236328, 0.00019246339797973633, 0.00019979476928710938, 0.00020712614059448242, 0.00021445751190185547, 0.00022178888320922852, 0.00022912025451660156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 12.0, 8.0, 6.0, 10.0, 22.0, 17.0, 39.0, 68.0, 126.0, 156.0, 322.0, 515.0, 1123.0, 2485.0, 6937.0, 27671.0, 400651.0, 559262.0, 35523.0, 8122.0, 2882.0, 1236.0, 565.0, 292.0, 173.0, 113.0, 63.0, 41.0, 34.0, 19.0, 10.0, 16.0, 7.0, 4.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8662109375, -1.811431884765625, -1.75665283203125, -1.701873779296875, -1.6470947265625, -1.592315673828125, -1.53753662109375, -1.482757568359375, -1.427978515625, -1.373199462890625, -1.31842041015625, -1.263641357421875, -1.2088623046875, -1.154083251953125, -1.09930419921875, -1.044525146484375, -0.98974609375, -0.934967041015625, -0.88018798828125, -0.825408935546875, -0.7706298828125, -0.715850830078125, -0.66107177734375, -0.606292724609375, -0.551513671875, -0.496734619140625, -0.44195556640625, -0.387176513671875, -0.3323974609375, -0.277618408203125, -0.22283935546875, -0.168060302734375, -0.11328125, -0.058502197265625, -0.00372314453125, 0.051055908203125, 0.1058349609375, 0.160614013671875, 0.21539306640625, 0.270172119140625, 0.324951171875, 0.379730224609375, 0.43450927734375, 0.489288330078125, 0.5440673828125, 0.598846435546875, 0.65362548828125, 0.708404541015625, 0.76318359375, 0.817962646484375, 0.87274169921875, 0.927520751953125, 0.9822998046875, 1.037078857421875, 1.09185791015625, 1.146636962890625, 1.201416015625, 1.256195068359375, 1.31097412109375, 1.365753173828125, 1.4205322265625, 1.475311279296875, 1.53009033203125, 1.584869384765625, 1.6396484375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 13.0, 17.0, 26.0, 68.0, 141.0, 223.0, 221.0, 126.0, 69.0, 41.0, 17.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3406219482421875, -1.297454833984375, -1.2542877197265625, -1.21112060546875, -1.1679534912109375, -1.124786376953125, -1.0816192626953125, -1.0384521484375, -0.9952850341796875, -0.952117919921875, -0.9089508056640625, -0.86578369140625, -0.8226165771484375, -0.779449462890625, -0.7362823486328125, -0.693115234375, -0.6499481201171875, -0.606781005859375, -0.5636138916015625, -0.52044677734375, -0.4772796630859375, -0.434112548828125, -0.3909454345703125, -0.3477783203125, -0.3046112060546875, -0.261444091796875, -0.2182769775390625, -0.17510986328125, -0.1319427490234375, -0.088775634765625, -0.0456085205078125, -0.00244140625, 0.0407257080078125, 0.083892822265625, 0.1270599365234375, 0.17022705078125, 0.2133941650390625, 0.256561279296875, 0.2997283935546875, 0.3428955078125, 0.3860626220703125, 0.429229736328125, 0.4723968505859375, 0.51556396484375, 0.5587310791015625, 0.601898193359375, 0.6450653076171875, 0.688232421875, 0.7313995361328125, 0.774566650390625, 0.8177337646484375, 0.86090087890625, 0.9040679931640625, 0.947235107421875, 0.9904022216796875, 1.0335693359375, 1.0767364501953125, 1.119903564453125, 1.1630706787109375, 1.20623779296875, 1.2494049072265625, 1.292572021484375, 1.3357391357421875, 1.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 17.0, 24.0, 37.0, 55.0, 140.0, 203.0, 212.0, 143.0, 73.0, 31.0, 23.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.99288558959961, -16.475082397460938, -15.95727825164795, -15.439474105834961, -14.921669960021973, -14.403865814208984, -13.886062622070312, -13.368258476257324, -12.850454330444336, -12.332650184631348, -11.814846992492676, -11.297042846679688, -10.7792387008667, -10.261434555053711, -9.743631362915039, -9.22582721710205, -8.708024024963379, -8.19021987915039, -7.6724162101745605, -7.1546125411987305, -6.636808395385742, -6.119004726409912, -5.601201057434082, -5.083396911621094, -4.565593242645264, -4.047789573669434, -3.5299854278564453, -3.0121817588806152, -2.494377851486206, -1.9765739440917969, -1.4587702751159668, -0.9409663677215576, -0.42316246032714844, 0.09464138746261597, 0.6124452352523804, 1.1302490234375, 1.6480529308319092, 2.1658568382263184, 2.6836605072021484, 3.2014644145965576, 3.719268321990967, 4.237071990966797, 4.754876136779785, 5.272679805755615, 5.790483474731445, 6.308287620544434, 6.826091289520264, 7.343894958496094, 7.861699104309082, 8.37950325012207, 8.897306442260742, 9.41511058807373, 9.932914733886719, 10.45071792602539, 10.968522071838379, 11.486326217651367, 12.004129409790039, 12.521933555603027, 13.0397367477417, 13.557540893554688, 14.075345039367676, 14.593149185180664, 15.110952377319336, 15.628756523132324, 16.146560668945312]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 9.0, 16.0, 23.0, 19.0, 32.0, 39.0, 42.0, 60.0, 52.0, 55.0, 76.0, 71.0, 86.0, 53.0, 51.0, 60.0, 37.0, 33.0, 37.0, 26.0, 25.0, 18.0, 12.0, 14.0, 11.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.542821884155273, -14.108731269836426, -13.674640655517578, -13.24055004119873, -12.806459426879883, -12.372369766235352, -11.938279151916504, -11.504188537597656, -11.070097923278809, -10.636007308959961, -10.201916694641113, -9.767826080322266, -9.333736419677734, -8.89964485168457, -8.465555191040039, -8.031464576721191, -7.597373962402344, -7.163283348083496, -6.729192733764648, -6.295102596282959, -5.861011981964111, -5.426921367645264, -4.992831230163574, -4.558740615844727, -4.124650001525879, -3.6905593872070312, -3.2564690113067627, -2.822378635406494, -2.3882880210876465, -1.9541974067687988, -1.5201070308685303, -1.0860166549682617, -0.6519260406494141, -0.21783554553985596, 0.21625494956970215, 0.6503454446792603, 1.0844359397888184, 1.518526554107666, 1.9526169300079346, 2.386707305908203, 2.820797920227051, 3.2548885345458984, 3.688978910446167, 4.1230692863464355, 4.557159900665283, 4.991250514984131, 5.42534065246582, 5.859431266784668, 6.293521881103516, 6.727612495422363, 7.161703109741211, 7.5957932472229, 8.029884338378906, 8.463973999023438, 8.898064613342285, 9.332155227661133, 9.76624584197998, 10.200336456298828, 10.634427070617676, 11.068517684936523, 11.502607345581055, 11.936698913574219, 12.37078857421875, 12.804879188537598, 13.238969802856445]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 5.0, 12.0, 5.0, 11.0, 7.0, 11.0, 18.0, 24.0, 24.0, 32.0, 42.0, 51.0, 71.0, 78.0, 104.0, 144.0, 195.0, 262.0, 361.0, 552.0, 838.0, 1502.0, 2551.0, 5224.0, 11179.0, 28399.0, 107046.0, 3193786.0, 723786.0, 75447.0, 22802.0, 9428.0, 4444.0, 2390.0, 1266.0, 739.0, 495.0, 299.0, 219.0, 135.0, 101.0, 56.0, 38.0, 35.0, 33.0, 8.0, 11.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.189453125, -3.107421875, -3.025390625, -2.943359375, -2.861328125, -2.779296875, -2.697265625, -2.615234375, -2.533203125, -2.451171875, -2.369140625, -2.287109375, -2.205078125, -2.123046875, -2.041015625, -1.958984375, -1.876953125, -1.794921875, -1.712890625, -1.630859375, -1.548828125, -1.466796875, -1.384765625, -1.302734375, -1.220703125, -1.138671875, -1.056640625, -0.974609375, -0.892578125, -0.810546875, -0.728515625, -0.646484375, -0.564453125, -0.482421875, -0.400390625, -0.318359375, -0.236328125, -0.154296875, -0.072265625, 0.009765625, 0.091796875, 0.173828125, 0.255859375, 0.337890625, 0.419921875, 0.501953125, 0.583984375, 0.666015625, 0.748046875, 0.830078125, 0.912109375, 0.994140625, 1.076171875, 1.158203125, 1.240234375, 1.322265625, 1.404296875, 1.486328125, 1.568359375, 1.650390625, 1.732421875, 1.814453125, 1.896484375, 1.978515625, 2.060546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 22.0, 33.0, 49.0, 60.0, 84.0, 69.0, 77.0, 100.0, 93.0, 61.0, 61.0, 66.0, 43.0, 42.0, 39.0, 15.0, 10.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.529296875, -0.5162696838378906, -0.5032424926757812, -0.4902153015136719, -0.4771881103515625, -0.4641609191894531, -0.45113372802734375, -0.4381065368652344, -0.425079345703125, -0.4120521545410156, -0.39902496337890625, -0.3859977722167969, -0.3729705810546875, -0.3599433898925781, -0.34691619873046875, -0.3338890075683594, -0.32086181640625, -0.3078346252441406, -0.29480743408203125, -0.2817802429199219, -0.2687530517578125, -0.2557258605957031, -0.24269866943359375, -0.22967147827148438, -0.216644287109375, -0.20361709594726562, -0.19058990478515625, -0.17756271362304688, -0.1645355224609375, -0.15150833129882812, -0.13848114013671875, -0.12545394897460938, -0.1124267578125, -0.09939956665039062, -0.08637237548828125, -0.07334518432617188, -0.0603179931640625, -0.047290802001953125, -0.03426361083984375, -0.021236419677734375, -0.008209228515625, 0.004817962646484375, 0.01784515380859375, 0.030872344970703125, 0.0438995361328125, 0.056926727294921875, 0.06995391845703125, 0.08298110961914062, 0.09600830078125, 0.10903549194335938, 0.12206268310546875, 0.13508987426757812, 0.1481170654296875, 0.16114425659179688, 0.17417144775390625, 0.18719863891601562, 0.200225830078125, 0.21325302124023438, 0.22628021240234375, 0.23930740356445312, 0.2523345947265625, 0.2653617858886719, 0.27838897705078125, 0.2914161682128906, 0.304443359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 10.0, 12.0, 14.0, 24.0, 46.0, 82.0, 128.0, 248.0, 518.0, 1246.0, 3289.0, 13288.0, 154921.0, 3921132.0, 83921.0, 10237.0, 2893.0, 1161.0, 490.0, 263.0, 131.0, 78.0, 58.0, 30.0, 15.0, 7.0, 2.0, 6.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.5, -4.36529541015625, -4.2305908203125, -4.09588623046875, -3.961181640625, -3.82647705078125, -3.6917724609375, -3.55706787109375, -3.42236328125, -3.28765869140625, -3.1529541015625, -3.01824951171875, -2.883544921875, -2.74884033203125, -2.6141357421875, -2.47943115234375, -2.3447265625, -2.21002197265625, -2.0753173828125, -1.94061279296875, -1.805908203125, -1.67120361328125, -1.5364990234375, -1.40179443359375, -1.26708984375, -1.13238525390625, -0.9976806640625, -0.86297607421875, -0.728271484375, -0.59356689453125, -0.4588623046875, -0.32415771484375, -0.189453125, -0.05474853515625, 0.0799560546875, 0.21466064453125, 0.349365234375, 0.48406982421875, 0.6187744140625, 0.75347900390625, 0.88818359375, 1.02288818359375, 1.1575927734375, 1.29229736328125, 1.427001953125, 1.56170654296875, 1.6964111328125, 1.83111572265625, 1.9658203125, 2.10052490234375, 2.2352294921875, 2.36993408203125, 2.504638671875, 2.63934326171875, 2.7740478515625, 2.90875244140625, 3.04345703125, 3.17816162109375, 3.3128662109375, 3.44757080078125, 3.582275390625, 3.71697998046875, 3.8516845703125, 3.98638916015625, 4.12109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 12.0, 16.0, 21.0, 39.0, 58.0, 100.0, 176.0, 469.0, 2117.0, 570.0, 194.0, 85.0, 67.0, 36.0, 39.0, 15.0, 7.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61572265625, -0.5925521850585938, -0.5693817138671875, -0.5462112426757812, -0.523040771484375, -0.49987030029296875, -0.4766998291015625, -0.45352935791015625, -0.43035888671875, -0.40718841552734375, -0.3840179443359375, -0.36084747314453125, -0.337677001953125, -0.31450653076171875, -0.2913360595703125, -0.26816558837890625, -0.2449951171875, -0.22182464599609375, -0.1986541748046875, -0.17548370361328125, -0.152313232421875, -0.12914276123046875, -0.1059722900390625, -0.08280181884765625, -0.05963134765625, -0.03646087646484375, -0.0132904052734375, 0.00988006591796875, 0.033050537109375, 0.05622100830078125, 0.0793914794921875, 0.10256195068359375, 0.125732421875, 0.14890289306640625, 0.1720733642578125, 0.19524383544921875, 0.218414306640625, 0.24158477783203125, 0.2647552490234375, 0.28792572021484375, 0.31109619140625, 0.33426666259765625, 0.3574371337890625, 0.38060760498046875, 0.403778076171875, 0.42694854736328125, 0.4501190185546875, 0.47328948974609375, 0.4964599609375, 0.5196304321289062, 0.5428009033203125, 0.5659713745117188, 0.589141845703125, 0.6123123168945312, 0.6354827880859375, 0.6586532592773438, 0.68182373046875, 0.7049942016601562, 0.7281646728515625, 0.7513351440429688, 0.774505615234375, 0.7976760864257812, 0.8208465576171875, 0.8440170288085938, 0.8671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 20.0, 33.0, 128.0, 256.0, 339.0, 139.0, 56.0, 17.0, 13.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.124211311340332, -9.889419555664062, -9.65462875366211, -9.41983699798584, -9.18504524230957, -8.950254440307617, -8.715462684631348, -8.480670928955078, -8.245880126953125, -8.011088371276855, -7.776297092437744, -7.541505813598633, -7.3067145347595215, -7.07192325592041, -6.837131500244141, -6.602340221405029, -6.36754846572876, -6.132757186889648, -5.897965431213379, -5.663174152374268, -5.428382873535156, -5.193591117858887, -4.958799839019775, -4.724008560180664, -4.4892168045043945, -4.254425525665283, -4.019633769989014, -3.7848424911499023, -3.550051212310791, -3.3152596950531006, -3.08046817779541, -2.845676898956299, -2.6108856201171875, -2.376094102859497, -2.1413028240203857, -1.9065113067626953, -1.6717199087142944, -1.4369285106658936, -1.2021369934082031, -0.9673455953598022, -0.7325541973114014, -0.4977627694606781, -0.26297134160995483, -0.02817988395690918, 0.2066115140914917, 0.4414029121398926, 0.676194429397583, 0.9109858274459839, 1.1457772254943848, 1.3805686235427856, 1.6153600215911865, 1.850151538848877, 2.0849428176879883, 2.3197343349456787, 2.554525852203369, 2.7893171310424805, 3.024108648300171, 3.2589001655578613, 3.4936914443969727, 3.728482961654663, 3.9632744789123535, 4.198065757751465, 4.432857513427734, 4.667648792266846, 4.902440071105957]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 16.0, 20.0, 18.0, 31.0, 45.0, 52.0, 54.0, 44.0, 60.0, 70.0, 65.0, 60.0, 63.0, 54.0, 56.0, 58.0, 43.0, 35.0, 27.0, 24.0, 20.0, 20.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1959757804870605, -2.1162328720092773, -2.036489963531494, -1.9567471742630005, -1.8770042657852173, -1.797261357307434, -1.7175185680389404, -1.6377756595611572, -1.558032751083374, -1.4782898426055908, -1.3985469341278076, -1.318804144859314, -1.2390612363815308, -1.1593183279037476, -1.079575538635254, -0.9998326301574707, -0.9200897216796875, -0.8403468132019043, -0.7606039643287659, -0.6808611154556274, -0.6011182069778442, -0.521375298500061, -0.4416324496269226, -0.3618896007537842, -0.282146692276001, -0.20240381360054016, -0.12266093492507935, -0.04291805624961853, 0.036824822425842285, 0.1165677011013031, 0.19631057977676392, 0.27605342864990234, 0.35579633712768555, 0.43553921580314636, 0.5152820944786072, 0.5950249433517456, 0.6747678518295288, 0.754510760307312, 0.8342536091804504, 0.9139964580535889, 0.9937393665313721, 1.0734822750091553, 1.1532251834869385, 1.2329679727554321, 1.3127108812332153, 1.3924537897109985, 1.4721965789794922, 1.5519394874572754, 1.6316823959350586, 1.7114253044128418, 1.791168212890625, 1.8709110021591187, 1.9506539106369019, 2.0303966999053955, 2.1101396083831787, 2.189882516860962, 2.269625425338745, 2.3493683338165283, 2.4291112422943115, 2.5088541507720947, 2.588596820831299, 2.668339729309082, 2.7480826377868652, 2.8278255462646484, 2.9075684547424316]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 10.0, 10.0, 17.0, 20.0, 27.0, 38.0, 55.0, 87.0, 115.0, 214.0, 306.0, 467.0, 879.0, 1536.0, 2904.0, 6466.0, 17007.0, 56175.0, 246303.0, 509209.0, 147731.0, 36676.0, 12047.0, 4826.0, 2328.0, 1165.0, 729.0, 424.0, 259.0, 157.0, 114.0, 64.0, 52.0, 41.0, 31.0, 23.0, 9.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.5, -2.434783935546875, -2.36956787109375, -2.304351806640625, -2.2391357421875, -2.173919677734375, -2.10870361328125, -2.043487548828125, -1.978271484375, -1.913055419921875, -1.84783935546875, -1.782623291015625, -1.7174072265625, -1.652191162109375, -1.58697509765625, -1.521759033203125, -1.45654296875, -1.391326904296875, -1.32611083984375, -1.260894775390625, -1.1956787109375, -1.130462646484375, -1.06524658203125, -1.000030517578125, -0.934814453125, -0.869598388671875, -0.80438232421875, -0.739166259765625, -0.6739501953125, -0.608734130859375, -0.54351806640625, -0.478302001953125, -0.4130859375, -0.347869873046875, -0.28265380859375, -0.217437744140625, -0.1522216796875, -0.087005615234375, -0.02178955078125, 0.043426513671875, 0.108642578125, 0.173858642578125, 0.23907470703125, 0.304290771484375, 0.3695068359375, 0.434722900390625, 0.49993896484375, 0.565155029296875, 0.63037109375, 0.695587158203125, 0.76080322265625, 0.826019287109375, 0.8912353515625, 0.956451416015625, 1.02166748046875, 1.086883544921875, 1.152099609375, 1.217315673828125, 1.28253173828125, 1.347747802734375, 1.4129638671875, 1.478179931640625, 1.54339599609375, 1.608612060546875, 1.673828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 14.0, 16.0, 20.0, 36.0, 61.0, 74.0, 88.0, 96.0, 94.0, 107.0, 77.0, 77.0, 65.0, 41.0, 37.0, 21.0, 23.0, 13.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5732498168945312, -0.5581207275390625, -0.5429916381835938, -0.527862548828125, -0.5127334594726562, -0.4976043701171875, -0.48247528076171875, -0.46734619140625, -0.45221710205078125, -0.4370880126953125, -0.42195892333984375, -0.406829833984375, -0.39170074462890625, -0.3765716552734375, -0.36144256591796875, -0.3463134765625, -0.33118438720703125, -0.3160552978515625, -0.30092620849609375, -0.285797119140625, -0.27066802978515625, -0.2555389404296875, -0.24040985107421875, -0.22528076171875, -0.21015167236328125, -0.1950225830078125, -0.17989349365234375, -0.164764404296875, -0.14963531494140625, -0.1345062255859375, -0.11937713623046875, -0.104248046875, -0.08911895751953125, -0.0739898681640625, -0.05886077880859375, -0.043731689453125, -0.02860260009765625, -0.0134735107421875, 0.00165557861328125, 0.01678466796875, 0.03191375732421875, 0.0470428466796875, 0.06217193603515625, 0.077301025390625, 0.09243011474609375, 0.1075592041015625, 0.12268829345703125, 0.1378173828125, 0.15294647216796875, 0.1680755615234375, 0.18320465087890625, 0.198333740234375, 0.21346282958984375, 0.2285919189453125, 0.24372100830078125, 0.25885009765625, 0.27397918701171875, 0.2891082763671875, 0.30423736572265625, 0.319366455078125, 0.33449554443359375, 0.3496246337890625, 0.36475372314453125, 0.3798828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 8.0, 19.0, 12.0, 33.0, 34.0, 40.0, 70.0, 94.0, 118.0, 207.0, 299.0, 620.0, 1082.0, 2035.0, 3976.0, 8658.0, 22841.0, 76346.0, 338952.0, 438871.0, 104457.0, 29264.0, 10598.0, 4633.0, 2320.0, 1199.0, 672.0, 405.0, 238.0, 137.0, 79.0, 67.0, 36.0, 30.0, 25.0, 27.0, 15.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5682373046875, -1.512451171875, -1.4566650390625, -1.40087890625, -1.3450927734375, -1.289306640625, -1.2335205078125, -1.177734375, -1.1219482421875, -1.066162109375, -1.0103759765625, -0.95458984375, -0.8988037109375, -0.843017578125, -0.7872314453125, -0.7314453125, -0.6756591796875, -0.619873046875, -0.5640869140625, -0.50830078125, -0.4525146484375, -0.396728515625, -0.3409423828125, -0.28515625, -0.2293701171875, -0.173583984375, -0.1177978515625, -0.06201171875, -0.0062255859375, 0.049560546875, 0.1053466796875, 0.1611328125, 0.2169189453125, 0.272705078125, 0.3284912109375, 0.38427734375, 0.4400634765625, 0.495849609375, 0.5516357421875, 0.607421875, 0.6632080078125, 0.718994140625, 0.7747802734375, 0.83056640625, 0.8863525390625, 0.942138671875, 0.9979248046875, 1.0537109375, 1.1094970703125, 1.165283203125, 1.2210693359375, 1.27685546875, 1.3326416015625, 1.388427734375, 1.4442138671875, 1.5, 1.5557861328125, 1.611572265625, 1.6673583984375, 1.72314453125, 1.7789306640625, 1.834716796875, 1.8905029296875, 1.9462890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 6.0, 7.0, 14.0, 13.0, 19.0, 27.0, 38.0, 38.0, 47.0, 56.0, 76.0, 74.0, 79.0, 72.0, 73.0, 65.0, 58.0, 45.0, 31.0, 27.0, 27.0, 22.0, 20.0, 7.0, 7.0, 5.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.716552734375, -1.65576171875, -1.594970703125, -1.5341796875, -1.473388671875, -1.41259765625, -1.351806640625, -1.291015625, -1.230224609375, -1.16943359375, -1.108642578125, -1.0478515625, -0.987060546875, -0.92626953125, -0.865478515625, -0.8046875, -0.743896484375, -0.68310546875, -0.622314453125, -0.5615234375, -0.500732421875, -0.43994140625, -0.379150390625, -0.318359375, -0.257568359375, -0.19677734375, -0.135986328125, -0.0751953125, -0.014404296875, 0.04638671875, 0.107177734375, 0.16796875, 0.228759765625, 0.28955078125, 0.350341796875, 0.4111328125, 0.471923828125, 0.53271484375, 0.593505859375, 0.654296875, 0.715087890625, 0.77587890625, 0.836669921875, 0.8974609375, 0.958251953125, 1.01904296875, 1.079833984375, 1.140625, 1.201416015625, 1.26220703125, 1.322998046875, 1.3837890625, 1.444580078125, 1.50537109375, 1.566162109375, 1.626953125, 1.687744140625, 1.74853515625, 1.809326171875, 1.8701171875, 1.930908203125, 1.99169921875, 2.052490234375, 2.11328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 13.0, 15.0, 21.0, 35.0, 68.0, 80.0, 172.0, 473.0, 1233.0, 4781.0, 30394.0, 711924.0, 279068.0, 15705.0, 2961.0, 887.0, 322.0, 145.0, 82.0, 44.0, 32.0, 18.0, 13.0, 15.0, 12.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2954559326171875, -1.252044677734375, -1.2086334228515625, -1.16522216796875, -1.1218109130859375, -1.078399658203125, -1.0349884033203125, -0.9915771484375, -0.9481658935546875, -0.904754638671875, -0.8613433837890625, -0.81793212890625, -0.7745208740234375, -0.731109619140625, -0.6876983642578125, -0.644287109375, -0.6008758544921875, -0.557464599609375, -0.5140533447265625, -0.47064208984375, -0.4272308349609375, -0.383819580078125, -0.3404083251953125, -0.2969970703125, -0.2535858154296875, -0.210174560546875, -0.1667633056640625, -0.12335205078125, -0.0799407958984375, -0.036529541015625, 0.0068817138671875, 0.05029296875, 0.0937042236328125, 0.137115478515625, 0.1805267333984375, 0.22393798828125, 0.2673492431640625, 0.310760498046875, 0.3541717529296875, 0.3975830078125, 0.4409942626953125, 0.484405517578125, 0.5278167724609375, 0.57122802734375, 0.6146392822265625, 0.658050537109375, 0.7014617919921875, 0.744873046875, 0.7882843017578125, 0.831695556640625, 0.8751068115234375, 0.91851806640625, 0.9619293212890625, 1.005340576171875, 1.0487518310546875, 1.0921630859375, 1.1355743408203125, 1.178985595703125, 1.2223968505859375, 1.26580810546875, 1.3092193603515625, 1.352630615234375, 1.3960418701171875, 1.439453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 16.0, 14.0, 12.0, 21.0, 23.0, 30.0, 44.0, 59.0, 59.0, 88.0, 99.0, 110.0, 63.0, 68.0, 66.0, 50.0, 33.0, 25.0, 23.0, 17.0, 6.0, 2.0, 10.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.77799466252327e-05, -8.484162390232086e-05, -8.190330117940903e-05, -7.896497845649719e-05, -7.602665573358536e-05, -7.308833301067352e-05, -7.015001028776169e-05, -6.721168756484985e-05, -6.427336484193802e-05, -6.133504211902618e-05, -5.839671939611435e-05, -5.5458396673202515e-05, -5.252007395029068e-05, -4.9581751227378845e-05, -4.664342850446701e-05, -4.3705105781555176e-05, -4.076678305864334e-05, -3.7828460335731506e-05, -3.489013761281967e-05, -3.195181488990784e-05, -2.9013492166996002e-05, -2.6075169444084167e-05, -2.3136846721172333e-05, -2.0198523998260498e-05, -1.7260201275348663e-05, -1.4321878552436829e-05, -1.1383555829524994e-05, -8.44523310661316e-06, -5.5069103837013245e-06, -2.5685876607894897e-06, 3.6973506212234497e-07, 3.3080577850341797e-06, 6.246380507946014e-06, 9.184703230857849e-06, 1.2123025953769684e-05, 1.5061348676681519e-05, 1.7999671399593353e-05, 2.0937994122505188e-05, 2.3876316845417023e-05, 2.6814639568328857e-05, 2.9752962291240692e-05, 3.269128501415253e-05, 3.562960773706436e-05, 3.8567930459976196e-05, 4.150625318288803e-05, 4.4444575905799866e-05, 4.73828986287117e-05, 5.0321221351623535e-05, 5.325954407453537e-05, 5.6197866797447205e-05, 5.913618952035904e-05, 6.207451224327087e-05, 6.501283496618271e-05, 6.795115768909454e-05, 7.088948041200638e-05, 7.382780313491821e-05, 7.676612585783005e-05, 7.970444858074188e-05, 8.264277130365372e-05, 8.558109402656555e-05, 8.851941674947739e-05, 9.145773947238922e-05, 9.439606219530106e-05, 9.733438491821289e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 10.0, 13.0, 21.0, 35.0, 58.0, 83.0, 83.0, 151.0, 258.0, 388.0, 696.0, 1455.0, 2926.0, 7007.0, 19449.0, 80842.0, 544797.0, 321897.0, 44996.0, 13219.0, 5166.0, 2303.0, 1093.0, 563.0, 345.0, 224.0, 139.0, 99.0, 58.0, 46.0, 34.0, 28.0, 24.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.8017578125, -0.7805633544921875, -0.759368896484375, -0.7381744384765625, -0.71697998046875, -0.6957855224609375, -0.674591064453125, -0.6533966064453125, -0.6322021484375, -0.6110076904296875, -0.589813232421875, -0.5686187744140625, -0.54742431640625, -0.5262298583984375, -0.505035400390625, -0.4838409423828125, -0.462646484375, -0.4414520263671875, -0.420257568359375, -0.3990631103515625, -0.37786865234375, -0.3566741943359375, -0.335479736328125, -0.3142852783203125, -0.2930908203125, -0.2718963623046875, -0.250701904296875, -0.2295074462890625, -0.20831298828125, -0.1871185302734375, -0.165924072265625, -0.1447296142578125, -0.12353515625, -0.1023406982421875, -0.081146240234375, -0.0599517822265625, -0.03875732421875, -0.0175628662109375, 0.003631591796875, 0.0248260498046875, 0.0460205078125, 0.0672149658203125, 0.088409423828125, 0.1096038818359375, 0.13079833984375, 0.1519927978515625, 0.173187255859375, 0.1943817138671875, 0.215576171875, 0.2367706298828125, 0.257965087890625, 0.2791595458984375, 0.30035400390625, 0.3215484619140625, 0.342742919921875, 0.3639373779296875, 0.3851318359375, 0.4063262939453125, 0.427520751953125, 0.4487152099609375, 0.46990966796875, 0.4911041259765625, 0.512298583984375, 0.5334930419921875, 0.5546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 16.0, 23.0, 50.0, 74.0, 117.0, 161.0, 145.0, 137.0, 82.0, 63.0, 42.0, 16.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.841064453125, -0.81787109375, -0.794677734375, -0.771484375, -0.748291015625, -0.72509765625, -0.701904296875, -0.6787109375, -0.655517578125, -0.63232421875, -0.609130859375, -0.5859375, -0.562744140625, -0.53955078125, -0.516357421875, -0.4931640625, -0.469970703125, -0.44677734375, -0.423583984375, -0.400390625, -0.377197265625, -0.35400390625, -0.330810546875, -0.3076171875, -0.284423828125, -0.26123046875, -0.238037109375, -0.21484375, -0.191650390625, -0.16845703125, -0.145263671875, -0.1220703125, -0.098876953125, -0.07568359375, -0.052490234375, -0.029296875, -0.006103515625, 0.01708984375, 0.040283203125, 0.0634765625, 0.086669921875, 0.10986328125, 0.133056640625, 0.15625, 0.179443359375, 0.20263671875, 0.225830078125, 0.2490234375, 0.272216796875, 0.29541015625, 0.318603515625, 0.341796875, 0.364990234375, 0.38818359375, 0.411376953125, 0.4345703125, 0.457763671875, 0.48095703125, 0.504150390625, 0.52734375, 0.550537109375, 0.57373046875, 0.596923828125, 0.6201171875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 18.0, 78.0, 240.0, 442.0, 147.0, 51.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.11605453491211, -11.13099193572998, -10.145928382873535, -9.160865783691406, -8.175802230834961, -7.190739631652832, -6.205677032470703, -5.220613956451416, -4.235550880432129, -3.250487804412842, -2.265424966812134, -1.2803621292114258, -0.29529905319213867, 0.6897640228271484, 1.6748266220092773, 2.6598896980285645, 3.6449527740478516, 4.630015850067139, 5.615078926086426, 6.600141525268555, 7.585204601287842, 8.570267677307129, 9.555330276489258, 10.540393829345703, 11.525456428527832, 12.510519027709961, 13.495582580566406, 14.480645179748535, 15.465707778930664, 16.45077133178711, 17.435832977294922, 18.420896530151367, 19.405960083007812, 20.391023635864258, 21.37608528137207, 22.361148834228516, 23.34621238708496, 24.331275939941406, 25.31633758544922, 26.301401138305664, 27.28646469116211, 28.271528244018555, 29.256589889526367, 30.241653442382812, 31.226716995239258, 32.2117805480957, 33.196842193603516, 34.18190383911133, 35.166969299316406, 36.15203094482422, 37.1370964050293, 38.12215805053711, 39.10721969604492, 40.09228515625, 41.07734680175781, 42.062408447265625, 43.04747009277344, 44.03253173828125, 45.01759719848633, 46.00265884399414, 46.98772048950195, 47.97278594970703, 48.957847595214844, 49.942909240722656, 50.927974700927734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 19.0, 21.0, 32.0, 50.0, 61.0, 60.0, 80.0, 81.0, 89.0, 92.0, 76.0, 69.0, 60.0, 49.0, 38.0, 41.0, 23.0, 17.0, 9.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.135910034179688, -11.665919303894043, -11.195928573608398, -10.725937843322754, -10.25594711303711, -9.785955429077148, -9.315964698791504, -8.84597396850586, -8.375983238220215, -7.90599250793457, -7.436001777648926, -6.966010570526123, -6.4960198402404785, -6.026029109954834, -5.556037902832031, -5.086047172546387, -4.616056442260742, -4.146065711975098, -3.676074743270874, -3.2060837745666504, -2.736093044281006, -2.2661023139953613, -1.7961113452911377, -1.326120376586914, -0.8561296463012695, -0.38613879680633545, 0.08385205268859863, 0.5538429021835327, 1.0238337516784668, 1.4938244819641113, 1.963815450668335, 2.4338064193725586, 2.903797149658203, 3.3737878799438477, 3.8437788486480713, 4.313769817352295, 4.7837605476379395, 5.253751277923584, 5.723742485046387, 6.193733215332031, 6.663723945617676, 7.13371467590332, 7.603705406188965, 8.07369613647461, 8.54368782043457, 9.013677597045898, 9.48366928100586, 9.953660011291504, 10.423650741577148, 10.893641471862793, 11.363632202148438, 11.833622932434082, 12.303613662719727, 12.773605346679688, 13.243596076965332, 13.713586807250977, 14.183577537536621, 14.653568267822266, 15.12355899810791, 15.593549728393555, 16.063541412353516, 16.533531188964844, 17.003522872924805, 17.473514556884766, 17.943504333496094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 9.0, 11.0, 15.0, 14.0, 29.0, 22.0, 31.0, 23.0, 56.0, 70.0, 81.0, 124.0, 197.0, 265.0, 403.0, 658.0, 1189.0, 2189.0, 4750.0, 11641.0, 38283.0, 265997.0, 3679933.0, 142909.0, 27409.0, 9295.0, 3829.0, 1894.0, 1046.0, 623.0, 372.0, 255.0, 159.0, 140.0, 92.0, 78.0, 51.0, 40.0, 25.0, 23.0, 11.0, 4.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.19140625, -2.13116455078125, -2.0709228515625, -2.01068115234375, -1.950439453125, -1.89019775390625, -1.8299560546875, -1.76971435546875, -1.70947265625, -1.64923095703125, -1.5889892578125, -1.52874755859375, -1.468505859375, -1.40826416015625, -1.3480224609375, -1.28778076171875, -1.2275390625, -1.16729736328125, -1.1070556640625, -1.04681396484375, -0.986572265625, -0.92633056640625, -0.8660888671875, -0.80584716796875, -0.74560546875, -0.68536376953125, -0.6251220703125, -0.56488037109375, -0.504638671875, -0.44439697265625, -0.3841552734375, -0.32391357421875, -0.263671875, -0.20343017578125, -0.1431884765625, -0.08294677734375, -0.022705078125, 0.03753662109375, 0.0977783203125, 0.15802001953125, 0.21826171875, 0.27850341796875, 0.3387451171875, 0.39898681640625, 0.459228515625, 0.51947021484375, 0.5797119140625, 0.63995361328125, 0.7001953125, 0.76043701171875, 0.8206787109375, 0.88092041015625, 0.941162109375, 1.00140380859375, 1.0616455078125, 1.12188720703125, 1.18212890625, 1.24237060546875, 1.3026123046875, 1.36285400390625, 1.423095703125, 1.48333740234375, 1.5435791015625, 1.60382080078125, 1.6640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 4.0, 15.0, 15.0, 18.0, 25.0, 45.0, 39.0, 56.0, 78.0, 74.0, 100.0, 81.0, 79.0, 68.0, 63.0, 57.0, 46.0, 33.0, 22.0, 19.0, 14.0, 9.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4619140625, -0.449188232421875, -0.43646240234375, -0.423736572265625, -0.4110107421875, -0.398284912109375, -0.38555908203125, -0.372833251953125, -0.360107421875, -0.347381591796875, -0.33465576171875, -0.321929931640625, -0.3092041015625, -0.296478271484375, -0.28375244140625, -0.271026611328125, -0.25830078125, -0.245574951171875, -0.23284912109375, -0.220123291015625, -0.2073974609375, -0.194671630859375, -0.18194580078125, -0.169219970703125, -0.156494140625, -0.143768310546875, -0.13104248046875, -0.118316650390625, -0.1055908203125, -0.092864990234375, -0.08013916015625, -0.067413330078125, -0.0546875, -0.041961669921875, -0.02923583984375, -0.016510009765625, -0.0037841796875, 0.008941650390625, 0.02166748046875, 0.034393310546875, 0.047119140625, 0.059844970703125, 0.07257080078125, 0.085296630859375, 0.0980224609375, 0.110748291015625, 0.12347412109375, 0.136199951171875, 0.14892578125, 0.161651611328125, 0.17437744140625, 0.187103271484375, 0.1998291015625, 0.212554931640625, 0.22528076171875, 0.238006591796875, 0.250732421875, 0.263458251953125, 0.27618408203125, 0.288909912109375, 0.3016357421875, 0.314361572265625, 0.32708740234375, 0.339813232421875, 0.3525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 6.0, 33.0, 46.0, 64.0, 94.0, 168.0, 303.0, 606.0, 1537.0, 5002.0, 27148.0, 816624.0, 3294427.0, 38437.0, 6125.0, 1997.0, 788.0, 385.0, 211.0, 95.0, 58.0, 39.0, 22.0, 15.0, 8.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.26531982421875, -2.1712646484375, -2.07720947265625, -1.983154296875, -1.88909912109375, -1.7950439453125, -1.70098876953125, -1.60693359375, -1.51287841796875, -1.4188232421875, -1.32476806640625, -1.230712890625, -1.13665771484375, -1.0426025390625, -0.94854736328125, -0.8544921875, -0.76043701171875, -0.6663818359375, -0.57232666015625, -0.478271484375, -0.38421630859375, -0.2901611328125, -0.19610595703125, -0.10205078125, -0.00799560546875, 0.0860595703125, 0.18011474609375, 0.274169921875, 0.36822509765625, 0.4622802734375, 0.55633544921875, 0.650390625, 0.74444580078125, 0.8385009765625, 0.93255615234375, 1.026611328125, 1.12066650390625, 1.2147216796875, 1.30877685546875, 1.40283203125, 1.49688720703125, 1.5909423828125, 1.68499755859375, 1.779052734375, 1.87310791015625, 1.9671630859375, 2.06121826171875, 2.1552734375, 2.24932861328125, 2.3433837890625, 2.43743896484375, 2.531494140625, 2.62554931640625, 2.7196044921875, 2.81365966796875, 2.90771484375, 3.00177001953125, 3.0958251953125, 3.18988037109375, 3.283935546875, 3.37799072265625, 3.4720458984375, 3.56610107421875, 3.66015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 15.0, 30.0, 34.0, 44.0, 82.0, 164.0, 429.0, 2022.0, 739.0, 238.0, 95.0, 63.0, 28.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.68994140625, -0.670623779296875, -0.65130615234375, -0.631988525390625, -0.6126708984375, -0.593353271484375, -0.57403564453125, -0.554718017578125, -0.535400390625, -0.516082763671875, -0.49676513671875, -0.477447509765625, -0.4581298828125, -0.438812255859375, -0.41949462890625, -0.400177001953125, -0.380859375, -0.361541748046875, -0.34222412109375, -0.322906494140625, -0.3035888671875, -0.284271240234375, -0.26495361328125, -0.245635986328125, -0.226318359375, -0.207000732421875, -0.18768310546875, -0.168365478515625, -0.1490478515625, -0.129730224609375, -0.11041259765625, -0.091094970703125, -0.07177734375, -0.052459716796875, -0.03314208984375, -0.013824462890625, 0.0054931640625, 0.024810791015625, 0.04412841796875, 0.063446044921875, 0.082763671875, 0.102081298828125, 0.12139892578125, 0.140716552734375, 0.1600341796875, 0.179351806640625, 0.19866943359375, 0.217987060546875, 0.2373046875, 0.256622314453125, 0.27593994140625, 0.295257568359375, 0.3145751953125, 0.333892822265625, 0.35321044921875, 0.372528076171875, 0.391845703125, 0.411163330078125, 0.43048095703125, 0.449798583984375, 0.4691162109375, 0.488433837890625, 0.50775146484375, 0.527069091796875, 0.54638671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 23.0, 35.0, 47.0, 86.0, 145.0, 187.0, 174.0, 119.0, 68.0, 49.0, 20.0, 23.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1480159759521484, -3.045922040939331, -2.9438281059265137, -2.8417341709136963, -2.739640235900879, -2.6375465393066406, -2.5354526042938232, -2.433358669281006, -2.3312647342681885, -2.229170799255371, -2.1270768642425537, -2.0249829292297363, -1.9228891134262085, -1.8207951784133911, -1.7187013626098633, -1.616607427597046, -1.5145134925842285, -1.4124195575714111, -1.3103256225585938, -1.208231806755066, -1.1061378717422485, -1.0040439367294312, -0.9019500613212585, -0.7998561859130859, -0.6977622509002686, -0.5956683158874512, -0.49357444047927856, -0.39148053526878357, -0.2893866300582886, -0.1872926950454712, -0.08519881963729858, 0.016895055770874023, 0.1189889907836914, 0.2210828959941864, 0.3231768012046814, 0.4252707064151764, 0.5273646116256714, 0.6294585466384888, 0.7315524220466614, 0.833646297454834, 0.9357402324676514, 1.0378341674804688, 1.1399281024932861, 1.242021918296814, 1.3441158533096313, 1.4462097883224487, 1.5483036041259766, 1.650397539138794, 1.7524914741516113, 1.8545854091644287, 1.956679344177246, 2.0587732791900635, 2.160867214202881, 2.262960910797119, 2.3650548458099365, 2.467148780822754, 2.5692427158355713, 2.6713366508483887, 2.773430585861206, 2.8755245208740234, 2.9776182174682617, 3.079712390899658, 3.1818060874938965, 3.283900022506714, 3.3859939575195312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 9.0, 17.0, 17.0, 30.0, 39.0, 28.0, 39.0, 36.0, 47.0, 41.0, 40.0, 46.0, 68.0, 56.0, 51.0, 46.0, 49.0, 44.0, 35.0, 34.0, 35.0, 30.0, 18.0, 24.0, 18.0, 13.0, 15.0, 10.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5459598302841187, -1.4918259382247925, -1.4376921653747559, -1.3835582733154297, -1.3294243812561035, -1.275290608406067, -1.2211567163467407, -1.167022943496704, -1.112889051437378, -1.0587551593780518, -1.0046213865280151, -0.950487494468689, -0.8963536620140076, -0.8422198295593262, -0.7880859375, -0.7339521050453186, -0.6798182725906372, -0.6256844401359558, -0.5715506076812744, -0.5174167156219482, -0.46328288316726685, -0.40914905071258545, -0.35501518845558167, -0.3008813261985779, -0.24674749374389648, -0.1926136463880539, -0.1384797990322113, -0.08434595167636871, -0.030212104320526123, 0.023921728134155273, 0.07805559039115906, 0.13218945264816284, 0.1863234043121338, 0.24045725166797638, 0.29459109902381897, 0.34872496128082275, 0.40285879373550415, 0.45699262619018555, 0.5111265182495117, 0.5652603507041931, 0.6193941831588745, 0.6735280156135559, 0.7276618480682373, 0.7817957401275635, 0.8359295725822449, 0.8900634050369263, 0.9441972970962524, 0.9983311295509338, 1.0524649620056152, 1.1065988540649414, 1.160732626914978, 1.2148665189743042, 1.2690002918243408, 1.323134183883667, 1.3772680759429932, 1.4314019680023193, 1.485535740852356, 1.5396696329116821, 1.5938034057617188, 1.647937297821045, 1.702071189880371, 1.7562049627304077, 1.8103388547897339, 1.8644726276397705, 1.9186065196990967]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 11.0, 22.0, 30.0, 42.0, 56.0, 64.0, 132.0, 184.0, 291.0, 473.0, 867.0, 1504.0, 2831.0, 6262.0, 17450.0, 69233.0, 334411.0, 463733.0, 110032.0, 25040.0, 8135.0, 3417.0, 1749.0, 976.0, 568.0, 375.0, 219.0, 160.0, 102.0, 57.0, 42.0, 19.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.8974609375, -1.8345184326171875, -1.771575927734375, -1.7086334228515625, -1.64569091796875, -1.5827484130859375, -1.519805908203125, -1.4568634033203125, -1.3939208984375, -1.3309783935546875, -1.268035888671875, -1.2050933837890625, -1.14215087890625, -1.0792083740234375, -1.016265869140625, -0.9533233642578125, -0.890380859375, -0.8274383544921875, -0.764495849609375, -0.7015533447265625, -0.63861083984375, -0.5756683349609375, -0.512725830078125, -0.4497833251953125, -0.3868408203125, -0.3238983154296875, -0.260955810546875, -0.1980133056640625, -0.13507080078125, -0.0721282958984375, -0.009185791015625, 0.0537567138671875, 0.11669921875, 0.1796417236328125, 0.242584228515625, 0.3055267333984375, 0.36846923828125, 0.4314117431640625, 0.494354248046875, 0.5572967529296875, 0.6202392578125, 0.6831817626953125, 0.746124267578125, 0.8090667724609375, 0.87200927734375, 0.9349517822265625, 0.997894287109375, 1.0608367919921875, 1.123779296875, 1.1867218017578125, 1.249664306640625, 1.3126068115234375, 1.37554931640625, 1.4384918212890625, 1.501434326171875, 1.5643768310546875, 1.6273193359375, 1.6902618408203125, 1.753204345703125, 1.8161468505859375, 1.87908935546875, 1.9420318603515625, 2.004974365234375, 2.0679168701171875, 2.130859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 13.0, 9.0, 29.0, 27.0, 50.0, 52.0, 71.0, 92.0, 80.0, 91.0, 88.0, 86.0, 65.0, 59.0, 45.0, 38.0, 32.0, 16.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.497314453125, -0.4833412170410156, -0.46936798095703125, -0.4553947448730469, -0.4414215087890625, -0.4274482727050781, -0.41347503662109375, -0.3995018005371094, -0.385528564453125, -0.3715553283691406, -0.35758209228515625, -0.3436088562011719, -0.3296356201171875, -0.3156623840332031, -0.30168914794921875, -0.2877159118652344, -0.27374267578125, -0.2597694396972656, -0.24579620361328125, -0.23182296752929688, -0.2178497314453125, -0.20387649536132812, -0.18990325927734375, -0.17593002319335938, -0.161956787109375, -0.14798355102539062, -0.13401031494140625, -0.12003707885742188, -0.1060638427734375, -0.09209060668945312, -0.07811737060546875, -0.06414413452148438, -0.0501708984375, -0.036197662353515625, -0.02222442626953125, -0.008251190185546875, 0.0057220458984375, 0.019695281982421875, 0.03366851806640625, 0.047641754150390625, 0.061614990234375, 0.07558822631835938, 0.08956146240234375, 0.10353469848632812, 0.1175079345703125, 0.13148117065429688, 0.14545440673828125, 0.15942764282226562, 0.17340087890625, 0.18737411499023438, 0.20134735107421875, 0.21532058715820312, 0.2292938232421875, 0.24326705932617188, 0.25724029541015625, 0.2712135314941406, 0.285186767578125, 0.2991600036621094, 0.31313323974609375, 0.3271064758300781, 0.3410797119140625, 0.3550529479980469, 0.36902618408203125, 0.3829994201660156, 0.39697265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 10.0, 25.0, 32.0, 50.0, 55.0, 89.0, 128.0, 179.0, 319.0, 598.0, 1185.0, 2516.0, 6352.0, 19212.0, 75328.0, 366338.0, 442402.0, 96914.0, 23372.0, 7519.0, 2929.0, 1292.0, 631.0, 386.0, 243.0, 157.0, 97.0, 55.0, 30.0, 21.0, 26.0, 20.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6945037841796875, -1.639984130859375, -1.5854644775390625, -1.53094482421875, -1.4764251708984375, -1.421905517578125, -1.3673858642578125, -1.3128662109375, -1.2583465576171875, -1.203826904296875, -1.1493072509765625, -1.09478759765625, -1.0402679443359375, -0.985748291015625, -0.9312286376953125, -0.876708984375, -0.8221893310546875, -0.767669677734375, -0.7131500244140625, -0.65863037109375, -0.6041107177734375, -0.549591064453125, -0.4950714111328125, -0.4405517578125, -0.3860321044921875, -0.331512451171875, -0.2769927978515625, -0.22247314453125, -0.1679534912109375, -0.113433837890625, -0.0589141845703125, -0.00439453125, 0.0501251220703125, 0.104644775390625, 0.1591644287109375, 0.21368408203125, 0.2682037353515625, 0.322723388671875, 0.3772430419921875, 0.4317626953125, 0.4862823486328125, 0.540802001953125, 0.5953216552734375, 0.64984130859375, 0.7043609619140625, 0.758880615234375, 0.8134002685546875, 0.867919921875, 0.9224395751953125, 0.976959228515625, 1.0314788818359375, 1.08599853515625, 1.1405181884765625, 1.195037841796875, 1.2495574951171875, 1.3040771484375, 1.3585968017578125, 1.413116455078125, 1.4676361083984375, 1.52215576171875, 1.5766754150390625, 1.631195068359375, 1.6857147216796875, 1.740234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 5.0, 3.0, 6.0, 10.0, 12.0, 13.0, 27.0, 29.0, 36.0, 35.0, 46.0, 53.0, 62.0, 63.0, 63.0, 50.0, 61.0, 72.0, 55.0, 62.0, 37.0, 30.0, 35.0, 30.0, 21.0, 14.0, 12.0, 14.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.94140625, -1.8896026611328125, -1.837799072265625, -1.7859954833984375, -1.73419189453125, -1.6823883056640625, -1.630584716796875, -1.5787811279296875, -1.5269775390625, -1.4751739501953125, -1.423370361328125, -1.3715667724609375, -1.31976318359375, -1.2679595947265625, -1.216156005859375, -1.1643524169921875, -1.112548828125, -1.0607452392578125, -1.008941650390625, -0.9571380615234375, -0.90533447265625, -0.8535308837890625, -0.801727294921875, -0.7499237060546875, -0.6981201171875, -0.6463165283203125, -0.594512939453125, -0.5427093505859375, -0.49090576171875, -0.4391021728515625, -0.387298583984375, -0.3354949951171875, -0.28369140625, -0.2318878173828125, -0.180084228515625, -0.1282806396484375, -0.07647705078125, -0.0246734619140625, 0.027130126953125, 0.0789337158203125, 0.1307373046875, 0.1825408935546875, 0.234344482421875, 0.2861480712890625, 0.33795166015625, 0.3897552490234375, 0.441558837890625, 0.4933624267578125, 0.545166015625, 0.5969696044921875, 0.648773193359375, 0.7005767822265625, 0.75238037109375, 0.8041839599609375, 0.855987548828125, 0.9077911376953125, 0.9595947265625, 1.0113983154296875, 1.063201904296875, 1.1150054931640625, 1.16680908203125, 1.2186126708984375, 1.270416259765625, 1.3222198486328125, 1.3740234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 14.0, 27.0, 55.0, 93.0, 167.0, 308.0, 704.0, 1895.0, 6973.0, 48827.0, 671121.0, 291244.0, 20693.0, 4006.0, 1302.0, 514.0, 255.0, 139.0, 72.0, 54.0, 18.0, 13.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.05859375, -1.0281829833984375, -0.997772216796875, -0.9673614501953125, -0.93695068359375, -0.9065399169921875, -0.876129150390625, -0.8457183837890625, -0.8153076171875, -0.7848968505859375, -0.754486083984375, -0.7240753173828125, -0.69366455078125, -0.6632537841796875, -0.632843017578125, -0.6024322509765625, -0.572021484375, -0.5416107177734375, -0.511199951171875, -0.4807891845703125, -0.45037841796875, -0.4199676513671875, -0.389556884765625, -0.3591461181640625, -0.3287353515625, -0.2983245849609375, -0.267913818359375, -0.2375030517578125, -0.20709228515625, -0.1766815185546875, -0.146270751953125, -0.1158599853515625, -0.08544921875, -0.0550384521484375, -0.024627685546875, 0.0057830810546875, 0.03619384765625, 0.0666046142578125, 0.097015380859375, 0.1274261474609375, 0.1578369140625, 0.1882476806640625, 0.218658447265625, 0.2490692138671875, 0.27947998046875, 0.3098907470703125, 0.340301513671875, 0.3707122802734375, 0.401123046875, 0.4315338134765625, 0.461944580078125, 0.4923553466796875, 0.52276611328125, 0.5531768798828125, 0.583587646484375, 0.6139984130859375, 0.6444091796875, 0.6748199462890625, 0.705230712890625, 0.7356414794921875, 0.76605224609375, 0.7964630126953125, 0.826873779296875, 0.8572845458984375, 0.8876953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 11.0, 25.0, 23.0, 25.0, 41.0, 60.0, 72.0, 88.0, 98.0, 104.0, 96.0, 81.0, 65.0, 52.0, 44.0, 28.0, 19.0, 14.0, 7.0, 4.0, 12.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011944770812988281, -0.00011563487350940704, -0.00011182203888893127, -0.0001080092042684555, -0.00010419636964797974, -0.00010038353502750397, -9.65707004070282e-05, -9.275786578655243e-05, -8.894503116607666e-05, -8.513219654560089e-05, -8.131936192512512e-05, -7.750652730464935e-05, -7.369369268417358e-05, -6.988085806369781e-05, -6.606802344322205e-05, -6.225518882274628e-05, -5.844235420227051e-05, -5.462951958179474e-05, -5.081668496131897e-05, -4.70038503408432e-05, -4.319101572036743e-05, -3.937818109989166e-05, -3.5565346479415894e-05, -3.1752511858940125e-05, -2.7939677238464355e-05, -2.4126842617988586e-05, -2.0314007997512817e-05, -1.650117337703705e-05, -1.268833875656128e-05, -8.87550413608551e-06, -5.062669515609741e-06, -1.2498348951339722e-06, 2.562999725341797e-06, 6.375834345817566e-06, 1.0188668966293335e-05, 1.4001503586769104e-05, 1.7814338207244873e-05, 2.1627172827720642e-05, 2.544000744819641e-05, 2.925284206867218e-05, 3.306567668914795e-05, 3.687851130962372e-05, 4.069134593009949e-05, 4.4504180550575256e-05, 4.8317015171051025e-05, 5.2129849791526794e-05, 5.5942684412002563e-05, 5.975551903247833e-05, 6.35683536529541e-05, 6.738118827342987e-05, 7.119402289390564e-05, 7.500685751438141e-05, 7.881969213485718e-05, 8.263252675533295e-05, 8.644536137580872e-05, 9.025819599628448e-05, 9.407103061676025e-05, 9.788386523723602e-05, 0.00010169669985771179, 0.00010550953447818756, 0.00010932236909866333, 0.0001131352037191391, 0.00011694803833961487, 0.00012076087296009064, 0.0001245737075805664]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 9.0, 23.0, 33.0, 70.0, 119.0, 268.0, 698.0, 2157.0, 10511.0, 143935.0, 810995.0, 70055.0, 7029.0, 1591.0, 575.0, 252.0, 95.0, 45.0, 28.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.4041595458984375, -1.371795654296875, -1.3394317626953125, -1.30706787109375, -1.2747039794921875, -1.242340087890625, -1.2099761962890625, -1.1776123046875, -1.1452484130859375, -1.112884521484375, -1.0805206298828125, -1.04815673828125, -1.0157928466796875, -0.983428955078125, -0.9510650634765625, -0.918701171875, -0.8863372802734375, -0.853973388671875, -0.8216094970703125, -0.78924560546875, -0.7568817138671875, -0.724517822265625, -0.6921539306640625, -0.6597900390625, -0.6274261474609375, -0.595062255859375, -0.5626983642578125, -0.53033447265625, -0.4979705810546875, -0.465606689453125, -0.4332427978515625, -0.40087890625, -0.3685150146484375, -0.336151123046875, -0.3037872314453125, -0.27142333984375, -0.2390594482421875, -0.206695556640625, -0.1743316650390625, -0.1419677734375, -0.1096038818359375, -0.077239990234375, -0.0448760986328125, -0.01251220703125, 0.0198516845703125, 0.052215576171875, 0.0845794677734375, 0.116943359375, 0.1493072509765625, 0.181671142578125, 0.2140350341796875, 0.24639892578125, 0.2787628173828125, 0.311126708984375, 0.3434906005859375, 0.3758544921875, 0.4082183837890625, 0.440582275390625, 0.4729461669921875, 0.50531005859375, 0.5376739501953125, 0.570037841796875, 0.6024017333984375, 0.634765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 10.0, 21.0, 19.0, 47.0, 31.0, 68.0, 92.0, 110.0, 122.0, 137.0, 97.0, 65.0, 56.0, 44.0, 23.0, 13.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7294921875, -0.7124176025390625, -0.695343017578125, -0.6782684326171875, -0.66119384765625, -0.6441192626953125, -0.627044677734375, -0.6099700927734375, -0.5928955078125, -0.5758209228515625, -0.558746337890625, -0.5416717529296875, -0.52459716796875, -0.5075225830078125, -0.490447998046875, -0.4733734130859375, -0.456298828125, -0.4392242431640625, -0.422149658203125, -0.4050750732421875, -0.38800048828125, -0.3709259033203125, -0.353851318359375, -0.3367767333984375, -0.3197021484375, -0.3026275634765625, -0.285552978515625, -0.2684783935546875, -0.25140380859375, -0.2343292236328125, -0.217254638671875, -0.2001800537109375, -0.18310546875, -0.1660308837890625, -0.148956298828125, -0.1318817138671875, -0.11480712890625, -0.0977325439453125, -0.080657958984375, -0.0635833740234375, -0.0465087890625, -0.0294342041015625, -0.012359619140625, 0.0047149658203125, 0.02178955078125, 0.0388641357421875, 0.055938720703125, 0.0730133056640625, 0.090087890625, 0.1071624755859375, 0.124237060546875, 0.1413116455078125, 0.15838623046875, 0.1754608154296875, 0.192535400390625, 0.2096099853515625, 0.2266845703125, 0.2437591552734375, 0.260833740234375, 0.2779083251953125, 0.29498291015625, 0.3120574951171875, 0.329132080078125, 0.3462066650390625, 0.36328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 11.0, 5.0, 7.0, 16.0, 20.0, 34.0, 47.0, 81.0, 120.0, 162.0, 158.0, 126.0, 69.0, 53.0, 39.0, 18.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.183361053466797, -11.862210273742676, -11.541058540344238, -11.219907760620117, -10.898756980895996, -10.577606201171875, -10.256454467773438, -9.935303688049316, -9.614152908325195, -9.293002128601074, -8.971850395202637, -8.650699615478516, -8.329548835754395, -8.008398056030273, -7.687246322631836, -7.366095542907715, -7.044943809509277, -6.723792552947998, -6.402641773223877, -6.081490516662598, -5.760339736938477, -5.439188480377197, -5.118037223815918, -4.796886444091797, -4.475735187530518, -4.154583930969238, -3.833433151245117, -3.512281894683838, -3.1911308765411377, -2.8699798583984375, -2.548828601837158, -2.227677583694458, -1.9065256118774414, -1.5853745937347412, -1.2642234563827515, -0.9430723786354065, -0.6219213008880615, -0.30077028274536133, 0.020380854606628418, 0.34153199195861816, 0.6626830101013184, 0.9838340878486633, 1.3049851655960083, 1.626136302947998, 1.9472873210906982, 2.2684383392333984, 2.5895895957946777, 2.910740613937378, 3.231891632080078, 3.5530426502227783, 3.8741936683654785, 4.195344924926758, 4.516495704650879, 4.837646961212158, 5.1587982177734375, 5.479948997497559, 5.801100254058838, 6.122251510620117, 6.443402290344238, 6.764553546905518, 7.085704803466797, 7.406855583190918, 7.728006839752197, 8.049158096313477, 8.370308876037598]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 12.0, 15.0, 21.0, 25.0, 25.0, 47.0, 43.0, 65.0, 51.0, 59.0, 85.0, 79.0, 75.0, 84.0, 67.0, 54.0, 30.0, 36.0, 26.0, 32.0, 13.0, 14.0, 15.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.267683029174805, -15.89025592803955, -15.51282787322998, -15.135400772094727, -14.757972717285156, -14.380545616149902, -14.003117561340332, -13.625690460205078, -13.248262405395508, -12.870835304260254, -12.493407249450684, -12.11598014831543, -11.73855209350586, -11.361124992370605, -10.983696937561035, -10.606269836425781, -10.228841781616211, -9.851414680480957, -9.473986625671387, -9.096559524536133, -8.719131469726562, -8.341704368591309, -7.964276313781738, -7.586849212646484, -7.2094221115112305, -6.831994533538818, -6.454566955566406, -6.077139377593994, -5.699711799621582, -5.32228422164917, -4.944856643676758, -4.567429542541504, -4.190001487731934, -3.8125739097595215, -3.4351463317871094, -3.0577187538146973, -2.680291175842285, -2.302863597869873, -1.92543625831604, -1.548008680343628, -1.1705811023712158, -0.7931535243988037, -0.4157260060310364, -0.03829848766326904, 0.33912909030914307, 0.7165566682815552, 1.0939841270446777, 1.4714117050170898, 1.848839282989502, 2.226266860961914, 2.603694438934326, 2.9811220169067383, 3.3585495948791504, 3.7359771728515625, 4.113404273986816, 4.490832328796387, 4.868259429931641, 5.245687007904053, 5.623114585876465, 6.000542163848877, 6.377969741821289, 6.755397319793701, 7.132824897766113, 7.510251998901367, 7.8876800537109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 10.0, 15.0, 17.0, 20.0, 28.0, 27.0, 44.0, 39.0, 55.0, 66.0, 106.0, 122.0, 196.0, 262.0, 365.0, 586.0, 1003.0, 1834.0, 3794.0, 8953.0, 27618.0, 151565.0, 3674503.0, 265498.0, 36975.0, 11083.0, 4393.0, 2130.0, 1082.0, 636.0, 430.0, 245.0, 160.0, 108.0, 74.0, 61.0, 37.0, 31.0, 22.0, 22.0, 22.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.4140625, -2.34222412109375, -2.2703857421875, -2.19854736328125, -2.126708984375, -2.05487060546875, -1.9830322265625, -1.91119384765625, -1.83935546875, -1.76751708984375, -1.6956787109375, -1.62384033203125, -1.552001953125, -1.48016357421875, -1.4083251953125, -1.33648681640625, -1.2646484375, -1.19281005859375, -1.1209716796875, -1.04913330078125, -0.977294921875, -0.90545654296875, -0.8336181640625, -0.76177978515625, -0.68994140625, -0.61810302734375, -0.5462646484375, -0.47442626953125, -0.402587890625, -0.33074951171875, -0.2589111328125, -0.18707275390625, -0.115234375, -0.04339599609375, 0.0284423828125, 0.10028076171875, 0.172119140625, 0.24395751953125, 0.3157958984375, 0.38763427734375, 0.45947265625, 0.53131103515625, 0.6031494140625, 0.67498779296875, 0.746826171875, 0.81866455078125, 0.8905029296875, 0.96234130859375, 1.0341796875, 1.10601806640625, 1.1778564453125, 1.24969482421875, 1.321533203125, 1.39337158203125, 1.4652099609375, 1.53704833984375, 1.60888671875, 1.68072509765625, 1.7525634765625, 1.82440185546875, 1.896240234375, 1.96807861328125, 2.0399169921875, 2.11175537109375, 2.18359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 18.0, 20.0, 31.0, 53.0, 56.0, 71.0, 88.0, 94.0, 91.0, 89.0, 69.0, 77.0, 51.0, 46.0, 39.0, 30.0, 17.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.47998046875, -0.466064453125, -0.4521484375, -0.438232421875, -0.42431640625, -0.410400390625, -0.396484375, -0.382568359375, -0.36865234375, -0.354736328125, -0.3408203125, -0.326904296875, -0.31298828125, -0.299072265625, -0.28515625, -0.271240234375, -0.25732421875, -0.243408203125, -0.2294921875, -0.215576171875, -0.20166015625, -0.187744140625, -0.173828125, -0.159912109375, -0.14599609375, -0.132080078125, -0.1181640625, -0.104248046875, -0.09033203125, -0.076416015625, -0.0625, -0.048583984375, -0.03466796875, -0.020751953125, -0.0068359375, 0.007080078125, 0.02099609375, 0.034912109375, 0.048828125, 0.062744140625, 0.07666015625, 0.090576171875, 0.1044921875, 0.118408203125, 0.13232421875, 0.146240234375, 0.16015625, 0.174072265625, 0.18798828125, 0.201904296875, 0.2158203125, 0.229736328125, 0.24365234375, 0.257568359375, 0.271484375, 0.285400390625, 0.29931640625, 0.313232421875, 0.3271484375, 0.341064453125, 0.35498046875, 0.368896484375, 0.3828125, 0.396728515625, 0.41064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 7.0, 18.0, 46.0, 78.0, 112.0, 234.0, 507.0, 1160.0, 2944.0, 8940.0, 48239.0, 3818852.0, 286479.0, 18504.0, 4893.0, 1762.0, 715.0, 337.0, 172.0, 99.0, 59.0, 30.0, 27.0, 11.0, 13.0, 8.0, 6.0, 8.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8984375, -2.7813720703125, -2.664306640625, -2.5472412109375, -2.43017578125, -2.3131103515625, -2.196044921875, -2.0789794921875, -1.9619140625, -1.8448486328125, -1.727783203125, -1.6107177734375, -1.49365234375, -1.3765869140625, -1.259521484375, -1.1424560546875, -1.025390625, -0.9083251953125, -0.791259765625, -0.6741943359375, -0.55712890625, -0.4400634765625, -0.322998046875, -0.2059326171875, -0.0888671875, 0.0281982421875, 0.145263671875, 0.2623291015625, 0.37939453125, 0.4964599609375, 0.613525390625, 0.7305908203125, 0.84765625, 0.9647216796875, 1.081787109375, 1.1988525390625, 1.31591796875, 1.4329833984375, 1.550048828125, 1.6671142578125, 1.7841796875, 1.9012451171875, 2.018310546875, 2.1353759765625, 2.25244140625, 2.3695068359375, 2.486572265625, 2.6036376953125, 2.720703125, 2.8377685546875, 2.954833984375, 3.0718994140625, 3.18896484375, 3.3060302734375, 3.423095703125, 3.5401611328125, 3.6572265625, 3.7742919921875, 3.891357421875, 4.0084228515625, 4.12548828125, 4.2425537109375, 4.359619140625, 4.4766845703125, 4.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 7.0, 17.0, 17.0, 29.0, 76.0, 127.0, 368.0, 2040.0, 932.0, 244.0, 85.0, 44.0, 27.0, 11.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.9521484375, -0.912109375, -0.8720703125, -0.83203125, -0.7919921875, -0.751953125, -0.7119140625, -0.671875, -0.6318359375, -0.591796875, -0.5517578125, -0.51171875, -0.4716796875, -0.431640625, -0.3916015625, -0.3515625, -0.3115234375, -0.271484375, -0.2314453125, -0.19140625, -0.1513671875, -0.111328125, -0.0712890625, -0.03125, 0.0087890625, 0.048828125, 0.0888671875, 0.12890625, 0.1689453125, 0.208984375, 0.2490234375, 0.2890625, 0.3291015625, 0.369140625, 0.4091796875, 0.44921875, 0.4892578125, 0.529296875, 0.5693359375, 0.609375, 0.6494140625, 0.689453125, 0.7294921875, 0.76953125, 0.8095703125, 0.849609375, 0.8896484375, 0.9296875, 0.9697265625, 1.009765625, 1.0498046875, 1.08984375, 1.1298828125, 1.169921875, 1.2099609375, 1.25, 1.2900390625, 1.330078125, 1.3701171875, 1.41015625, 1.4501953125, 1.490234375, 1.5302734375, 1.5703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 35.0, 143.0, 305.0, 305.0, 125.0, 42.0, 17.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.918496131896973, -13.593974113464355, -13.269453048706055, -12.944931030273438, -12.62040901184082, -12.29588794708252, -11.971365928649902, -11.646844863891602, -11.322322845458984, -10.997800827026367, -10.673279762268066, -10.34875774383545, -10.024236679077148, -9.699714660644531, -9.375192642211914, -9.050670623779297, -8.726149559020996, -8.401627540588379, -8.077106475830078, -7.752584457397461, -7.428062915802002, -7.103541374206543, -6.779019355773926, -6.454497814178467, -6.129976272583008, -5.805454730987549, -5.48093318939209, -5.156411170959473, -4.831889629364014, -4.507368087768555, -4.1828460693359375, -3.8583245277404785, -3.5338029861450195, -3.2092814445495605, -2.8847596645355225, -2.5602378845214844, -2.2357163429260254, -1.9111946821212769, -1.5866730213165283, -1.2621512413024902, -0.9376296997070312, -0.6131080389022827, -0.2885863780975342, 0.035935282707214355, 0.3604569435119629, 0.6849786043167114, 1.00950026512146, 1.334022045135498, 1.658543586730957, 1.9830652475357056, 2.307586908340454, 2.632108688354492, 2.956630229949951, 3.28115177154541, 3.6056735515594482, 3.9301953315734863, 4.254716873168945, 4.579238414764404, 4.903759956359863, 5.2282819747924805, 5.5528035163879395, 5.877325057983398, 6.201847076416016, 6.526368618011475, 6.850890159606934]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 11.0, 8.0, 8.0, 9.0, 25.0, 25.0, 34.0, 38.0, 57.0, 55.0, 67.0, 63.0, 94.0, 73.0, 80.0, 79.0, 62.0, 52.0, 38.0, 40.0, 28.0, 21.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.513881683349609, -4.385019302368164, -4.256156921386719, -4.127294063568115, -3.99843168258667, -3.8695693016052246, -3.7407069206237793, -3.611844539642334, -3.4829819202423096, -3.3541195392608643, -3.22525691986084, -3.0963945388793945, -2.967532157897949, -2.838669538497925, -2.7098071575164795, -2.580944538116455, -2.4520821571350098, -2.3232197761535645, -2.19435715675354, -2.0654947757720947, -1.9366322755813599, -1.807769775390625, -1.6789073944091797, -1.5500448942184448, -1.42118239402771, -1.292319893836975, -1.1634573936462402, -1.034595012664795, -0.9057325124740601, -0.7768700122833252, -0.6480075716972351, -0.519145131111145, -0.39028310775756836, -0.2614206373691559, -0.1325581669807434, -0.0036956965923309326, 0.12516677379608154, 0.2540292739868164, 0.3828917145729065, 0.5117541551589966, 0.6406166553497314, 0.7694791555404663, 0.8983415961265564, 1.0272040367126465, 1.1560665369033813, 1.2849290370941162, 1.4137914180755615, 1.5426539182662964, 1.6715164184570312, 1.8003789186477661, 1.929241418838501, 2.0581037998199463, 2.1869664192199707, 2.315828800201416, 2.4446911811828613, 2.5735535621643066, 2.702416181564331, 2.8312785625457764, 2.960141181945801, 3.089003562927246, 3.2178659439086914, 3.346728563308716, 3.475590944290161, 3.6044535636901855, 3.733315944671631]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 13.0, 15.0, 19.0, 25.0, 28.0, 49.0, 50.0, 78.0, 97.0, 145.0, 215.0, 268.0, 394.0, 572.0, 800.0, 1341.0, 2155.0, 4026.0, 9110.0, 29719.0, 147955.0, 547188.0, 236848.0, 43495.0, 11920.0, 4794.0, 2552.0, 1566.0, 945.0, 659.0, 425.0, 288.0, 201.0, 161.0, 99.0, 78.0, 57.0, 42.0, 34.0, 18.0, 23.0, 11.0, 18.0, 9.0, 5.0, 8.0, 7.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.9375, -1.8781280517578125, -1.818756103515625, -1.7593841552734375, -1.70001220703125, -1.6406402587890625, -1.581268310546875, -1.5218963623046875, -1.4625244140625, -1.4031524658203125, -1.343780517578125, -1.2844085693359375, -1.22503662109375, -1.1656646728515625, -1.106292724609375, -1.0469207763671875, -0.987548828125, -0.9281768798828125, -0.868804931640625, -0.8094329833984375, -0.75006103515625, -0.6906890869140625, -0.631317138671875, -0.5719451904296875, -0.5125732421875, -0.4532012939453125, -0.393829345703125, -0.3344573974609375, -0.27508544921875, -0.2157135009765625, -0.156341552734375, -0.0969696044921875, -0.03759765625, 0.0217742919921875, 0.081146240234375, 0.1405181884765625, 0.19989013671875, 0.2592620849609375, 0.318634033203125, 0.3780059814453125, 0.4373779296875, 0.4967498779296875, 0.556121826171875, 0.6154937744140625, 0.67486572265625, 0.7342376708984375, 0.793609619140625, 0.8529815673828125, 0.912353515625, 0.9717254638671875, 1.031097412109375, 1.0904693603515625, 1.14984130859375, 1.2092132568359375, 1.268585205078125, 1.3279571533203125, 1.3873291015625, 1.4467010498046875, 1.506072998046875, 1.5654449462890625, 1.62481689453125, 1.6841888427734375, 1.743560791015625, 1.8029327392578125, 1.8623046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 9.0, 14.0, 18.0, 35.0, 45.0, 70.0, 95.0, 104.0, 139.0, 100.0, 109.0, 88.0, 53.0, 38.0, 25.0, 14.0, 17.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6025390625, -0.5846481323242188, -0.5667572021484375, -0.5488662719726562, -0.530975341796875, -0.5130844116210938, -0.4951934814453125, -0.47730255126953125, -0.45941162109375, -0.44152069091796875, -0.4236297607421875, -0.40573883056640625, -0.387847900390625, -0.36995697021484375, -0.3520660400390625, -0.33417510986328125, -0.3162841796875, -0.29839324951171875, -0.2805023193359375, -0.26261138916015625, -0.244720458984375, -0.22682952880859375, -0.2089385986328125, -0.19104766845703125, -0.17315673828125, -0.15526580810546875, -0.1373748779296875, -0.11948394775390625, -0.101593017578125, -0.08370208740234375, -0.0658111572265625, -0.04792022705078125, -0.030029296875, -0.01213836669921875, 0.0057525634765625, 0.02364349365234375, 0.041534423828125, 0.05942535400390625, 0.0773162841796875, 0.09520721435546875, 0.11309814453125, 0.13098907470703125, 0.1488800048828125, 0.16677093505859375, 0.184661865234375, 0.20255279541015625, 0.2204437255859375, 0.23833465576171875, 0.2562255859375, 0.27411651611328125, 0.2920074462890625, 0.30989837646484375, 0.327789306640625, 0.34568023681640625, 0.3635711669921875, 0.38146209716796875, 0.39935302734375, 0.41724395751953125, 0.4351348876953125, 0.45302581787109375, 0.470916748046875, 0.48880767822265625, 0.5066986083984375, 0.5245895385742188, 0.54248046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 14.0, 15.0, 17.0, 29.0, 43.0, 57.0, 80.0, 91.0, 178.0, 289.0, 465.0, 853.0, 1622.0, 3329.0, 7738.0, 20960.0, 64275.0, 204074.0, 407638.0, 225997.0, 71943.0, 23205.0, 8342.0, 3452.0, 1580.0, 818.0, 460.0, 343.0, 197.0, 115.0, 75.0, 59.0, 56.0, 27.0, 30.0, 13.0, 14.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.0478515625, -1.015655517578125, -0.98345947265625, -0.951263427734375, -0.9190673828125, -0.886871337890625, -0.85467529296875, -0.822479248046875, -0.790283203125, -0.758087158203125, -0.72589111328125, -0.693695068359375, -0.6614990234375, -0.629302978515625, -0.59710693359375, -0.564910888671875, -0.53271484375, -0.500518798828125, -0.46832275390625, -0.436126708984375, -0.4039306640625, -0.371734619140625, -0.33953857421875, -0.307342529296875, -0.275146484375, -0.242950439453125, -0.21075439453125, -0.178558349609375, -0.1463623046875, -0.114166259765625, -0.08197021484375, -0.049774169921875, -0.017578125, 0.014617919921875, 0.04681396484375, 0.079010009765625, 0.1112060546875, 0.143402099609375, 0.17559814453125, 0.207794189453125, 0.239990234375, 0.272186279296875, 0.30438232421875, 0.336578369140625, 0.3687744140625, 0.400970458984375, 0.43316650390625, 0.465362548828125, 0.49755859375, 0.529754638671875, 0.56195068359375, 0.594146728515625, 0.6263427734375, 0.658538818359375, 0.69073486328125, 0.722930908203125, 0.755126953125, 0.787322998046875, 0.81951904296875, 0.851715087890625, 0.8839111328125, 0.916107177734375, 0.94830322265625, 0.980499267578125, 1.0126953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 11.0, 10.0, 20.0, 24.0, 33.0, 35.0, 35.0, 44.0, 44.0, 39.0, 45.0, 49.0, 49.0, 52.0, 50.0, 47.0, 47.0, 39.0, 26.0, 41.0, 42.0, 40.0, 25.0, 28.0, 20.0, 18.0, 20.0, 14.0, 8.0, 8.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.07421875, -1.0384674072265625, -1.002716064453125, -0.9669647216796875, -0.93121337890625, -0.8954620361328125, -0.859710693359375, -0.8239593505859375, -0.7882080078125, -0.7524566650390625, -0.716705322265625, -0.6809539794921875, -0.64520263671875, -0.6094512939453125, -0.573699951171875, -0.5379486083984375, -0.502197265625, -0.4664459228515625, -0.430694580078125, -0.3949432373046875, -0.35919189453125, -0.3234405517578125, -0.287689208984375, -0.2519378662109375, -0.2161865234375, -0.1804351806640625, -0.144683837890625, -0.1089324951171875, -0.07318115234375, -0.0374298095703125, -0.001678466796875, 0.0340728759765625, 0.06982421875, 0.1055755615234375, 0.141326904296875, 0.1770782470703125, 0.21282958984375, 0.2485809326171875, 0.284332275390625, 0.3200836181640625, 0.3558349609375, 0.3915863037109375, 0.427337646484375, 0.4630889892578125, 0.49884033203125, 0.5345916748046875, 0.570343017578125, 0.6060943603515625, 0.641845703125, 0.6775970458984375, 0.713348388671875, 0.7490997314453125, 0.78485107421875, 0.8206024169921875, 0.856353759765625, 0.8921051025390625, 0.9278564453125, 0.9636077880859375, 0.999359130859375, 1.0351104736328125, 1.07086181640625, 1.1066131591796875, 1.142364501953125, 1.1781158447265625, 1.2138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 9.0, 20.0, 25.0, 36.0, 79.0, 140.0, 286.0, 689.0, 2442.0, 14629.0, 336289.0, 660035.0, 28585.0, 3648.0, 928.0, 324.0, 143.0, 84.0, 48.0, 47.0, 23.0, 16.0, 10.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3769760131835938, -1.3408660888671875, -1.3047561645507812, -1.268646240234375, -1.2325363159179688, -1.1964263916015625, -1.1603164672851562, -1.12420654296875, -1.0880966186523438, -1.0519866943359375, -1.0158767700195312, -0.979766845703125, -0.9436569213867188, -0.9075469970703125, -0.8714370727539062, -0.8353271484375, -0.7992172241210938, -0.7631072998046875, -0.7269973754882812, -0.690887451171875, -0.6547775268554688, -0.6186676025390625, -0.5825576782226562, -0.54644775390625, -0.5103378295898438, -0.4742279052734375, -0.43811798095703125, -0.402008056640625, -0.36589813232421875, -0.3297882080078125, -0.29367828369140625, -0.257568359375, -0.22145843505859375, -0.1853485107421875, -0.14923858642578125, -0.113128662109375, -0.07701873779296875, -0.0409088134765625, -0.00479888916015625, 0.03131103515625, 0.06742095947265625, 0.1035308837890625, 0.13964080810546875, 0.175750732421875, 0.21186065673828125, 0.2479705810546875, 0.28408050537109375, 0.3201904296875, 0.35630035400390625, 0.3924102783203125, 0.42852020263671875, 0.464630126953125, 0.5007400512695312, 0.5368499755859375, 0.5729598999023438, 0.60906982421875, 0.6451797485351562, 0.6812896728515625, 0.7173995971679688, 0.753509521484375, 0.7896194458007812, 0.8257293701171875, 0.8618392944335938, 0.89794921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 19.0, 25.0, 22.0, 48.0, 72.0, 151.0, 186.0, 185.0, 124.0, 79.0, 45.0, 27.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00029659271240234375, -0.0002903798595070839, -0.00028416700661182404, -0.0002779541537165642, -0.0002717413008213043, -0.00026552844792604446, -0.0002593155950307846, -0.00025310274213552475, -0.0002468898892402649, -0.00024067703634500504, -0.00023446418344974518, -0.00022825133055448532, -0.00022203847765922546, -0.0002158256247639656, -0.00020961277186870575, -0.0002033999189734459, -0.00019718706607818604, -0.00019097421318292618, -0.00018476136028766632, -0.00017854850739240646, -0.0001723356544971466, -0.00016612280160188675, -0.0001599099487066269, -0.00015369709581136703, -0.00014748424291610718, -0.00014127139002084732, -0.00013505853712558746, -0.0001288456842303276, -0.00012263283133506775, -0.00011641997843980789, -0.00011020712554454803, -0.00010399427264928818, -9.778141975402832e-05, -9.156856685876846e-05, -8.53557139635086e-05, -7.914286106824875e-05, -7.293000817298889e-05, -6.671715527772903e-05, -6.050430238246918e-05, -5.429144948720932e-05, -4.807859659194946e-05, -4.1865743696689606e-05, -3.565289080142975e-05, -2.944003790616989e-05, -2.3227185010910034e-05, -1.7014332115650177e-05, -1.080147922039032e-05, -4.588626325130463e-06, 1.6242265701293945e-06, 7.837079465389252e-06, 1.4049932360649109e-05, 2.0262785255908966e-05, 2.6475638151168823e-05, 3.268849104642868e-05, 3.890134394168854e-05, 4.5114196836948395e-05, 5.132704973220825e-05, 5.753990262746811e-05, 6.375275552272797e-05, 6.996560841798782e-05, 7.617846131324768e-05, 8.239131420850754e-05, 8.86041671037674e-05, 9.481701999902725e-05, 0.00010102987289428711]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 10.0, 11.0, 18.0, 18.0, 34.0, 64.0, 122.0, 178.0, 432.0, 877.0, 2112.0, 6519.0, 27920.0, 183318.0, 594887.0, 192797.0, 28529.0, 6717.0, 2236.0, 844.0, 421.0, 223.0, 97.0, 59.0, 38.0, 25.0, 17.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5064926147460938, -0.4880828857421875, -0.46967315673828125, -0.451263427734375, -0.43285369873046875, -0.4144439697265625, -0.39603424072265625, -0.37762451171875, -0.35921478271484375, -0.3408050537109375, -0.32239532470703125, -0.303985595703125, -0.28557586669921875, -0.2671661376953125, -0.24875640869140625, -0.2303466796875, -0.21193695068359375, -0.1935272216796875, -0.17511749267578125, -0.156707763671875, -0.13829803466796875, -0.1198883056640625, -0.10147857666015625, -0.08306884765625, -0.06465911865234375, -0.0462493896484375, -0.02783966064453125, -0.009429931640625, 0.00897979736328125, 0.0273895263671875, 0.04579925537109375, 0.064208984375, 0.08261871337890625, 0.1010284423828125, 0.11943817138671875, 0.137847900390625, 0.15625762939453125, 0.1746673583984375, 0.19307708740234375, 0.21148681640625, 0.22989654541015625, 0.2483062744140625, 0.26671600341796875, 0.285125732421875, 0.30353546142578125, 0.3219451904296875, 0.34035491943359375, 0.3587646484375, 0.37717437744140625, 0.3955841064453125, 0.41399383544921875, 0.432403564453125, 0.45081329345703125, 0.4692230224609375, 0.48763275146484375, 0.50604248046875, 0.5244522094726562, 0.5428619384765625, 0.5612716674804688, 0.579681396484375, 0.5980911254882812, 0.6165008544921875, 0.6349105834960938, 0.6533203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 8.0, 19.0, 16.0, 22.0, 34.0, 40.0, 59.0, 64.0, 79.0, 105.0, 78.0, 87.0, 75.0, 64.0, 66.0, 33.0, 41.0, 25.0, 21.0, 16.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.34468841552734375, -0.3300018310546875, -0.31531524658203125, -0.300628662109375, -0.28594207763671875, -0.2712554931640625, -0.25656890869140625, -0.24188232421875, -0.22719573974609375, -0.2125091552734375, -0.19782257080078125, -0.183135986328125, -0.16844940185546875, -0.1537628173828125, -0.13907623291015625, -0.1243896484375, -0.10970306396484375, -0.0950164794921875, -0.08032989501953125, -0.065643310546875, -0.05095672607421875, -0.0362701416015625, -0.02158355712890625, -0.00689697265625, 0.00778961181640625, 0.0224761962890625, 0.03716278076171875, 0.051849365234375, 0.06653594970703125, 0.0812225341796875, 0.09590911865234375, 0.110595703125, 0.12528228759765625, 0.1399688720703125, 0.15465545654296875, 0.169342041015625, 0.18402862548828125, 0.1987152099609375, 0.21340179443359375, 0.22808837890625, 0.24277496337890625, 0.2574615478515625, 0.27214813232421875, 0.286834716796875, 0.30152130126953125, 0.3162078857421875, 0.33089447021484375, 0.3455810546875, 0.36026763916015625, 0.3749542236328125, 0.38964080810546875, 0.404327392578125, 0.41901397705078125, 0.4337005615234375, 0.44838714599609375, 0.46307373046875, 0.47776031494140625, 0.4924468994140625, 0.5071334838867188, 0.521820068359375, 0.5365066528320312, 0.5511932373046875, 0.5658798217773438, 0.58056640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 14.0, 26.0, 68.0, 129.0, 227.0, 242.0, 156.0, 58.0, 45.0, 21.0, 7.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.999469757080078, -18.576515197753906, -18.153560638427734, -17.730607986450195, -17.307653427124023, -16.88469886779785, -16.46174430847168, -16.03879165649414, -15.615837097167969, -15.192882537841797, -14.769928932189941, -14.34697437286377, -13.924020767211914, -13.501066207885742, -13.07811164855957, -12.655158042907715, -12.232203483581543, -11.809248924255371, -11.386295318603516, -10.963340759277344, -10.540387153625488, -10.117432594299316, -9.694478988647461, -9.271524429321289, -8.848569869995117, -8.425615310668945, -8.00266170501709, -7.579707145690918, -7.1567535400390625, -6.733798980712891, -6.310844898223877, -5.887890815734863, -5.464937210083008, -5.041983127593994, -4.6190290451049805, -4.196074485778809, -3.773120641708374, -3.3501665592193604, -2.9272122383117676, -2.504258155822754, -2.0813040733337402, -1.6583499908447266, -1.2353957891464233, -0.8124415874481201, -0.38948750495910645, 0.03346657752990723, 0.4564208984375, 0.8793749809265137, 1.3023290634155273, 1.725283145904541, 2.1482372283935547, 2.5711915493011475, 2.994145631790161, 3.417099714279175, 3.8400540351867676, 4.263008117675781, 4.685962200164795, 5.108916282653809, 5.531870365142822, 5.954824447631836, 6.377779006958008, 6.800732612609863, 7.223687171936035, 7.646641254425049, 8.069595336914062]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 8.0, 21.0, 15.0, 22.0, 20.0, 26.0, 31.0, 37.0, 31.0, 46.0, 51.0, 52.0, 69.0, 64.0, 67.0, 57.0, 46.0, 60.0, 47.0, 33.0, 43.0, 35.0, 30.0, 19.0, 20.0, 8.0, 14.0, 14.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.585875034332275, -7.340003490447998, -7.094131946563721, -6.848260402679443, -6.602388858795166, -6.356517314910889, -6.1106462478637695, -5.864774703979492, -5.618903160095215, -5.3730316162109375, -5.12716007232666, -4.881288528442383, -4.6354169845581055, -4.389545440673828, -4.143673896789551, -3.8978025913238525, -3.651930809020996, -3.4060592651367188, -3.1601877212524414, -2.914316177368164, -2.6684446334838867, -2.4225730895996094, -2.176701784133911, -1.9308302402496338, -1.6849586963653564, -1.439087152481079, -1.1932156085968018, -0.947344183921814, -0.7014726400375366, -0.4556010961532593, -0.20972967147827148, 0.03614187240600586, 0.282012939453125, 0.5278844833374023, 0.7737559676170349, 1.0196274518966675, 1.2654989957809448, 1.5113705396652222, 1.75724196434021, 2.0031135082244873, 2.2489850521087646, 2.494856595993042, 2.7407281398773193, 2.9865994453430176, 3.232470989227295, 3.4783425331115723, 3.7242140769958496, 3.970085620880127, 4.215957164764404, 4.461828708648682, 4.707700252532959, 4.953571796417236, 5.199443340301514, 5.445314884185791, 5.69118595123291, 5.9370574951171875, 6.182929039001465, 6.428800582885742, 6.6746721267700195, 6.920543670654297, 7.166415214538574, 7.412286758422852, 7.658158302307129, 7.904029846191406, 8.149901390075684]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 10.0, 21.0, 9.0, 24.0, 32.0, 43.0, 85.0, 136.0, 233.0, 407.0, 736.0, 1454.0, 4116.0, 21644.0, 1121111.0, 3012390.0, 24269.0, 4391.0, 1522.0, 737.0, 330.0, 221.0, 138.0, 83.0, 42.0, 20.0, 20.0, 14.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.50390625, -3.409271240234375, -3.31463623046875, -3.220001220703125, -3.1253662109375, -3.030731201171875, -2.93609619140625, -2.841461181640625, -2.746826171875, -2.652191162109375, -2.55755615234375, -2.462921142578125, -2.3682861328125, -2.273651123046875, -2.17901611328125, -2.084381103515625, -1.98974609375, -1.895111083984375, -1.80047607421875, -1.705841064453125, -1.6112060546875, -1.516571044921875, -1.42193603515625, -1.327301025390625, -1.232666015625, -1.138031005859375, -1.04339599609375, -0.948760986328125, -0.8541259765625, -0.759490966796875, -0.66485595703125, -0.570220947265625, -0.4755859375, -0.380950927734375, -0.28631591796875, -0.191680908203125, -0.0970458984375, -0.002410888671875, 0.09222412109375, 0.186859130859375, 0.281494140625, 0.376129150390625, 0.47076416015625, 0.565399169921875, 0.6600341796875, 0.754669189453125, 0.84930419921875, 0.943939208984375, 1.03857421875, 1.133209228515625, 1.22784423828125, 1.322479248046875, 1.4171142578125, 1.511749267578125, 1.60638427734375, 1.701019287109375, 1.795654296875, 1.890289306640625, 1.98492431640625, 2.079559326171875, 2.1741943359375, 2.268829345703125, 2.36346435546875, 2.458099365234375, 2.552734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 19.0, 35.0, 27.0, 77.0, 103.0, 110.0, 119.0, 122.0, 94.0, 89.0, 71.0, 34.0, 23.0, 24.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.63525390625, -0.6164703369140625, -0.597686767578125, -0.5789031982421875, -0.56011962890625, -0.5413360595703125, -0.522552490234375, -0.5037689208984375, -0.4849853515625, -0.4662017822265625, -0.447418212890625, -0.4286346435546875, -0.40985107421875, -0.3910675048828125, -0.372283935546875, -0.3535003662109375, -0.334716796875, -0.3159332275390625, -0.297149658203125, -0.2783660888671875, -0.25958251953125, -0.2407989501953125, -0.222015380859375, -0.2032318115234375, -0.1844482421875, -0.1656646728515625, -0.146881103515625, -0.1280975341796875, -0.10931396484375, -0.0905303955078125, -0.071746826171875, -0.0529632568359375, -0.0341796875, -0.0153961181640625, 0.003387451171875, 0.0221710205078125, 0.04095458984375, 0.0597381591796875, 0.078521728515625, 0.0973052978515625, 0.1160888671875, 0.1348724365234375, 0.153656005859375, 0.1724395751953125, 0.19122314453125, 0.2100067138671875, 0.228790283203125, 0.2475738525390625, 0.266357421875, 0.2851409912109375, 0.303924560546875, 0.3227081298828125, 0.34149169921875, 0.3602752685546875, 0.379058837890625, 0.3978424072265625, 0.4166259765625, 0.4354095458984375, 0.454193115234375, 0.4729766845703125, 0.49176025390625, 0.5105438232421875, 0.529327392578125, 0.5481109619140625, 0.56689453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 13.0, 10.0, 16.0, 28.0, 47.0, 65.0, 104.0, 169.0, 282.0, 528.0, 1124.0, 2770.0, 11407.0, 96060.0, 3834917.0, 222057.0, 18116.0, 3854.0, 1395.0, 625.0, 277.0, 152.0, 70.0, 52.0, 61.0, 22.0, 17.0, 15.0, 11.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.4822845458984375, -2.419647216796875, -2.3570098876953125, -2.29437255859375, -2.2317352294921875, -2.169097900390625, -2.1064605712890625, -2.0438232421875, -1.9811859130859375, -1.918548583984375, -1.8559112548828125, -1.79327392578125, -1.7306365966796875, -1.667999267578125, -1.6053619384765625, -1.542724609375, -1.4800872802734375, -1.417449951171875, -1.3548126220703125, -1.29217529296875, -1.2295379638671875, -1.166900634765625, -1.1042633056640625, -1.0416259765625, -0.9789886474609375, -0.916351318359375, -0.8537139892578125, -0.79107666015625, -0.7284393310546875, -0.665802001953125, -0.6031646728515625, -0.54052734375, -0.4778900146484375, -0.415252685546875, -0.3526153564453125, -0.28997802734375, -0.2273406982421875, -0.164703369140625, -0.1020660400390625, -0.0394287109375, 0.0232086181640625, 0.085845947265625, 0.1484832763671875, 0.21112060546875, 0.2737579345703125, 0.336395263671875, 0.3990325927734375, 0.461669921875, 0.5243072509765625, 0.586944580078125, 0.6495819091796875, 0.71221923828125, 0.7748565673828125, 0.837493896484375, 0.9001312255859375, 0.9627685546875, 1.0254058837890625, 1.088043212890625, 1.1506805419921875, 1.21331787109375, 1.2759552001953125, 1.338592529296875, 1.4012298583984375, 1.4638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 16.0, 29.0, 55.0, 140.0, 373.0, 2223.0, 848.0, 190.0, 74.0, 46.0, 33.0, 11.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0830612182617188, -1.0577239990234375, -1.0323867797851562, -1.007049560546875, -0.9817123413085938, -0.9563751220703125, -0.9310379028320312, -0.90570068359375, -0.8803634643554688, -0.8550262451171875, -0.8296890258789062, -0.804351806640625, -0.7790145874023438, -0.7536773681640625, -0.7283401489257812, -0.7030029296875, -0.6776657104492188, -0.6523284912109375, -0.6269912719726562, -0.601654052734375, -0.5763168334960938, -0.5509796142578125, -0.5256423950195312, -0.50030517578125, -0.47496795654296875, -0.4496307373046875, -0.42429351806640625, -0.398956298828125, -0.37361907958984375, -0.3482818603515625, -0.32294464111328125, -0.297607421875, -0.27227020263671875, -0.2469329833984375, -0.22159576416015625, -0.196258544921875, -0.17092132568359375, -0.1455841064453125, -0.12024688720703125, -0.09490966796875, -0.06957244873046875, -0.0442352294921875, -0.01889801025390625, 0.006439208984375, 0.03177642822265625, 0.0571136474609375, 0.08245086669921875, 0.1077880859375, 0.13312530517578125, 0.1584625244140625, 0.18379974365234375, 0.209136962890625, 0.23447418212890625, 0.2598114013671875, 0.28514862060546875, 0.31048583984375, 0.33582305908203125, 0.3611602783203125, 0.38649749755859375, 0.411834716796875, 0.43717193603515625, 0.4625091552734375, 0.48784637451171875, 0.51318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 22.0, 44.0, 113.0, 188.0, 246.0, 213.0, 94.0, 39.0, 22.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.731424808502197, -5.589971542358398, -5.4485182762146, -5.307065486907959, -5.16561222076416, -5.024158954620361, -4.8827056884765625, -4.741252422332764, -4.599799156188965, -4.458345890045166, -4.316892623901367, -4.175439834594727, -4.033986568450928, -3.892533302307129, -3.75108003616333, -3.6096267700195312, -3.4681739807128906, -3.326720714569092, -3.185267686843872, -3.0438144207000732, -2.9023613929748535, -2.7609081268310547, -2.619454860687256, -2.478001594543457, -2.3365485668182373, -2.1950953006744385, -2.0536422729492188, -1.91218900680542, -1.7707358598709106, -1.6292827129364014, -1.4878294467926025, -1.3463762998580933, -1.2049236297607422, -1.063470482826233, -0.9220172762870789, -0.7805640697479248, -0.6391109228134155, -0.49765777587890625, -0.3562045693397522, -0.21475136280059814, -0.07329821586608887, 0.0681549608707428, 0.20960813760757446, 0.35106131434440613, 0.4925144910812378, 0.6339676380157471, 0.7754208445549011, 0.9168740510940552, 1.0583271980285645, 1.1997803449630737, 1.341233491897583, 1.4826867580413818, 1.6241399049758911, 1.7655930519104004, 1.9070463180541992, 2.048499584197998, 2.1899526119232178, 2.3314058780670166, 2.4728589057922363, 2.614312171936035, 2.755765438079834, 2.8972184658050537, 3.0386717319488525, 3.1801247596740723, 3.321578025817871]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 11.0, 10.0, 12.0, 13.0, 31.0, 29.0, 32.0, 43.0, 36.0, 34.0, 55.0, 45.0, 50.0, 56.0, 54.0, 52.0, 63.0, 45.0, 36.0, 36.0, 46.0, 37.0, 29.0, 22.0, 23.0, 24.0, 10.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8159911632537842, -1.7610372304916382, -1.7060832977294922, -1.6511292457580566, -1.5961753129959106, -1.5412213802337646, -1.4862674474716187, -1.4313135147094727, -1.376359462738037, -1.3214055299758911, -1.2664515972137451, -1.2114975452423096, -1.1565436124801636, -1.1015896797180176, -1.0466357469558716, -0.9916818141937256, -0.9367278814315796, -0.8817739486694336, -0.8268199563026428, -0.7718660235404968, -0.716912031173706, -0.6619580984115601, -0.6070041656494141, -0.5520502328872681, -0.4970962405204773, -0.4421422779560089, -0.3871883153915405, -0.33223438262939453, -0.27728042006492615, -0.22232645750045776, -0.16737252473831177, -0.11241856217384338, -0.057464599609375, -0.002510644495487213, 0.052443310618400574, 0.10739725828170776, 0.16235122084617615, 0.21730518341064453, 0.2722591161727905, 0.3272130787372589, 0.3821670413017273, 0.4371210038661957, 0.49207496643066406, 0.5470288991928101, 0.601982831954956, 0.6569368243217468, 0.7118907570838928, 0.7668447494506836, 0.8217986822128296, 0.8767526149749756, 0.9317066073417664, 0.9866605401039124, 1.0416145324707031, 1.0965684652328491, 1.1515223979949951, 1.2064763307571411, 1.261430263519287, 1.316384196281433, 1.371338129043579, 1.4262921810150146, 1.4812461137771606, 1.5362000465393066, 1.5911539793014526, 1.6461079120635986, 1.7010619640350342]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 12.0, 8.0, 20.0, 12.0, 28.0, 26.0, 47.0, 62.0, 100.0, 111.0, 163.0, 237.0, 363.0, 485.0, 723.0, 1046.0, 1715.0, 2884.0, 6307.0, 19033.0, 90177.0, 452068.0, 375415.0, 68958.0, 15558.0, 5386.0, 2770.0, 1582.0, 1012.0, 704.0, 460.0, 323.0, 195.0, 151.0, 104.0, 82.0, 65.0, 54.0, 30.0, 22.0, 13.0, 19.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.61541748046875, -1.5531005859375, -1.49078369140625, -1.428466796875, -1.36614990234375, -1.3038330078125, -1.24151611328125, -1.17919921875, -1.11688232421875, -1.0545654296875, -0.99224853515625, -0.929931640625, -0.86761474609375, -0.8052978515625, -0.74298095703125, -0.6806640625, -0.61834716796875, -0.5560302734375, -0.49371337890625, -0.431396484375, -0.36907958984375, -0.3067626953125, -0.24444580078125, -0.18212890625, -0.11981201171875, -0.0574951171875, 0.00482177734375, 0.067138671875, 0.12945556640625, 0.1917724609375, 0.25408935546875, 0.31640625, 0.37872314453125, 0.4410400390625, 0.50335693359375, 0.565673828125, 0.62799072265625, 0.6903076171875, 0.75262451171875, 0.81494140625, 0.87725830078125, 0.9395751953125, 1.00189208984375, 1.064208984375, 1.12652587890625, 1.1888427734375, 1.25115966796875, 1.3134765625, 1.37579345703125, 1.4381103515625, 1.50042724609375, 1.562744140625, 1.62506103515625, 1.6873779296875, 1.74969482421875, 1.81201171875, 1.87432861328125, 1.9366455078125, 1.99896240234375, 2.061279296875, 2.12359619140625, 2.1859130859375, 2.24822998046875, 2.310546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 30.0, 28.0, 62.0, 70.0, 111.0, 112.0, 134.0, 110.0, 109.0, 78.0, 52.0, 33.0, 20.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.63232421875, -0.61279296875, -0.59326171875, -0.57373046875, -0.55419921875, -0.53466796875, -0.51513671875, -0.49560546875, -0.47607421875, -0.45654296875, -0.43701171875, -0.41748046875, -0.39794921875, -0.37841796875, -0.35888671875, -0.33935546875, -0.31982421875, -0.30029296875, -0.28076171875, -0.26123046875, -0.24169921875, -0.22216796875, -0.20263671875, -0.18310546875, -0.16357421875, -0.14404296875, -0.12451171875, -0.10498046875, -0.08544921875, -0.06591796875, -0.04638671875, -0.02685546875, -0.00732421875, 0.01220703125, 0.03173828125, 0.05126953125, 0.07080078125, 0.09033203125, 0.10986328125, 0.12939453125, 0.14892578125, 0.16845703125, 0.18798828125, 0.20751953125, 0.22705078125, 0.24658203125, 0.26611328125, 0.28564453125, 0.30517578125, 0.32470703125, 0.34423828125, 0.36376953125, 0.38330078125, 0.40283203125, 0.42236328125, 0.44189453125, 0.46142578125, 0.48095703125, 0.50048828125, 0.52001953125, 0.53955078125, 0.55908203125, 0.57861328125, 0.59814453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 14.0, 20.0, 21.0, 42.0, 45.0, 59.0, 120.0, 173.0, 272.0, 565.0, 1141.0, 2746.0, 7596.0, 23118.0, 82573.0, 295424.0, 427337.0, 147784.0, 39729.0, 12031.0, 4135.0, 1711.0, 797.0, 403.0, 269.0, 155.0, 87.0, 61.0, 42.0, 23.0, 19.0, 10.0, 9.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.10711669921875, -1.0716552734375, -1.03619384765625, -1.000732421875, -0.96527099609375, -0.9298095703125, -0.89434814453125, -0.85888671875, -0.82342529296875, -0.7879638671875, -0.75250244140625, -0.717041015625, -0.68157958984375, -0.6461181640625, -0.61065673828125, -0.5751953125, -0.53973388671875, -0.5042724609375, -0.46881103515625, -0.433349609375, -0.39788818359375, -0.3624267578125, -0.32696533203125, -0.29150390625, -0.25604248046875, -0.2205810546875, -0.18511962890625, -0.149658203125, -0.11419677734375, -0.0787353515625, -0.04327392578125, -0.0078125, 0.02764892578125, 0.0631103515625, 0.09857177734375, 0.134033203125, 0.16949462890625, 0.2049560546875, 0.24041748046875, 0.27587890625, 0.31134033203125, 0.3468017578125, 0.38226318359375, 0.417724609375, 0.45318603515625, 0.4886474609375, 0.52410888671875, 0.5595703125, 0.59503173828125, 0.6304931640625, 0.66595458984375, 0.701416015625, 0.73687744140625, 0.7723388671875, 0.80780029296875, 0.84326171875, 0.87872314453125, 0.9141845703125, 0.94964599609375, 0.985107421875, 1.02056884765625, 1.0560302734375, 1.09149169921875, 1.126953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 5.0, 7.0, 14.0, 10.0, 11.0, 22.0, 23.0, 38.0, 20.0, 35.0, 35.0, 56.0, 52.0, 62.0, 52.0, 50.0, 50.0, 56.0, 54.0, 52.0, 52.0, 44.0, 31.0, 31.0, 39.0, 21.0, 23.0, 16.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2007293701171875, -1.160247802734375, -1.1197662353515625, -1.07928466796875, -1.0388031005859375, -0.998321533203125, -0.9578399658203125, -0.9173583984375, -0.8768768310546875, -0.836395263671875, -0.7959136962890625, -0.75543212890625, -0.7149505615234375, -0.674468994140625, -0.6339874267578125, -0.593505859375, -0.5530242919921875, -0.512542724609375, -0.4720611572265625, -0.43157958984375, -0.3910980224609375, -0.350616455078125, -0.3101348876953125, -0.2696533203125, -0.2291717529296875, -0.188690185546875, -0.1482086181640625, -0.10772705078125, -0.0672454833984375, -0.026763916015625, 0.0137176513671875, 0.05419921875, 0.0946807861328125, 0.135162353515625, 0.1756439208984375, 0.21612548828125, 0.2566070556640625, 0.297088623046875, 0.3375701904296875, 0.3780517578125, 0.4185333251953125, 0.459014892578125, 0.4994964599609375, 0.53997802734375, 0.5804595947265625, 0.620941162109375, 0.6614227294921875, 0.701904296875, 0.7423858642578125, 0.782867431640625, 0.8233489990234375, 0.86383056640625, 0.9043121337890625, 0.944793701171875, 0.9852752685546875, 1.0257568359375, 1.0662384033203125, 1.106719970703125, 1.1472015380859375, 1.18768310546875, 1.2281646728515625, 1.268646240234375, 1.3091278076171875, 1.349609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 16.0, 27.0, 39.0, 63.0, 103.0, 161.0, 282.0, 617.0, 1377.0, 4309.0, 20513.0, 162677.0, 629782.0, 196792.0, 24055.0, 4790.0, 1583.0, 634.0, 299.0, 172.0, 100.0, 46.0, 32.0, 21.0, 14.0, 10.0, 8.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.669921875, -0.6505279541015625, -0.631134033203125, -0.6117401123046875, -0.59234619140625, -0.5729522705078125, -0.553558349609375, -0.5341644287109375, -0.5147705078125, -0.4953765869140625, -0.475982666015625, -0.4565887451171875, -0.43719482421875, -0.4178009033203125, -0.398406982421875, -0.3790130615234375, -0.359619140625, -0.3402252197265625, -0.320831298828125, -0.3014373779296875, -0.28204345703125, -0.2626495361328125, -0.243255615234375, -0.2238616943359375, -0.2044677734375, -0.1850738525390625, -0.165679931640625, -0.1462860107421875, -0.12689208984375, -0.1074981689453125, -0.088104248046875, -0.0687103271484375, -0.04931640625, -0.0299224853515625, -0.010528564453125, 0.0088653564453125, 0.02825927734375, 0.0476531982421875, 0.067047119140625, 0.0864410400390625, 0.1058349609375, 0.1252288818359375, 0.144622802734375, 0.1640167236328125, 0.18341064453125, 0.2028045654296875, 0.222198486328125, 0.2415924072265625, 0.260986328125, 0.2803802490234375, 0.299774169921875, 0.3191680908203125, 0.33856201171875, 0.3579559326171875, 0.377349853515625, 0.3967437744140625, 0.4161376953125, 0.4355316162109375, 0.454925537109375, 0.4743194580078125, 0.49371337890625, 0.5131072998046875, 0.532501220703125, 0.5518951416015625, 0.5712890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 9.0, 5.0, 7.0, 16.0, 20.0, 20.0, 28.0, 40.0, 39.0, 32.0, 66.0, 67.0, 90.0, 86.0, 91.0, 78.0, 63.0, 55.0, 45.0, 26.0, 20.0, 34.0, 12.0, 17.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.00010198354721069336, -9.93385910987854e-05, -9.669363498687744e-05, -9.404867887496948e-05, -9.140372276306152e-05, -8.875876665115356e-05, -8.61138105392456e-05, -8.346885442733765e-05, -8.082389831542969e-05, -7.817894220352173e-05, -7.553398609161377e-05, -7.288902997970581e-05, -7.024407386779785e-05, -6.759911775588989e-05, -6.495416164398193e-05, -6.230920553207397e-05, -5.9664249420166016e-05, -5.701929330825806e-05, -5.43743371963501e-05, -5.172938108444214e-05, -4.908442497253418e-05, -4.643946886062622e-05, -4.379451274871826e-05, -4.11495566368103e-05, -3.8504600524902344e-05, -3.5859644412994385e-05, -3.3214688301086426e-05, -3.056973218917847e-05, -2.7924776077270508e-05, -2.527981996536255e-05, -2.263486385345459e-05, -1.998990774154663e-05, -1.7344951629638672e-05, -1.4699995517730713e-05, -1.2055039405822754e-05, -9.410083293914795e-06, -6.765127182006836e-06, -4.120171070098877e-06, -1.475214958190918e-06, 1.169741153717041e-06, 3.814697265625e-06, 6.459653377532959e-06, 9.104609489440918e-06, 1.1749565601348877e-05, 1.4394521713256836e-05, 1.7039477825164795e-05, 1.9684433937072754e-05, 2.2329390048980713e-05, 2.4974346160888672e-05, 2.761930227279663e-05, 3.026425838470459e-05, 3.290921449661255e-05, 3.555417060852051e-05, 3.819912672042847e-05, 4.0844082832336426e-05, 4.3489038944244385e-05, 4.6133995056152344e-05, 4.87789511680603e-05, 5.142390727996826e-05, 5.406886339187622e-05, 5.671381950378418e-05, 5.935877561569214e-05, 6.20037317276001e-05, 6.464868783950806e-05, 6.729364395141602e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 3.0, 5.0, 5.0, 12.0, 23.0, 34.0, 47.0, 92.0, 142.0, 247.0, 478.0, 925.0, 2345.0, 6628.0, 25313.0, 126810.0, 484769.0, 317235.0, 62270.0, 13981.0, 4137.0, 1531.0, 682.0, 365.0, 197.0, 103.0, 62.0, 45.0, 24.0, 11.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.40769195556640625, -0.3930206298828125, -0.37834930419921875, -0.363677978515625, -0.34900665283203125, -0.3343353271484375, -0.31966400146484375, -0.30499267578125, -0.29032135009765625, -0.2756500244140625, -0.26097869873046875, -0.246307373046875, -0.23163604736328125, -0.2169647216796875, -0.20229339599609375, -0.1876220703125, -0.17295074462890625, -0.1582794189453125, -0.14360809326171875, -0.128936767578125, -0.11426544189453125, -0.0995941162109375, -0.08492279052734375, -0.07025146484375, -0.05558013916015625, -0.0409088134765625, -0.02623748779296875, -0.011566162109375, 0.00310516357421875, 0.0177764892578125, 0.03244781494140625, 0.047119140625, 0.06179046630859375, 0.0764617919921875, 0.09113311767578125, 0.105804443359375, 0.12047576904296875, 0.1351470947265625, 0.14981842041015625, 0.16448974609375, 0.17916107177734375, 0.1938323974609375, 0.20850372314453125, 0.223175048828125, 0.23784637451171875, 0.2525177001953125, 0.26718902587890625, 0.2818603515625, 0.29653167724609375, 0.3112030029296875, 0.32587432861328125, 0.340545654296875, 0.35521697998046875, 0.3698883056640625, 0.38455963134765625, 0.39923095703125, 0.41390228271484375, 0.4285736083984375, 0.44324493408203125, 0.457916259765625, 0.47258758544921875, 0.4872589111328125, 0.5019302368164062, 0.5166015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 10.0, 11.0, 24.0, 39.0, 27.0, 48.0, 81.0, 93.0, 94.0, 116.0, 88.0, 84.0, 69.0, 47.0, 44.0, 30.0, 22.0, 17.0, 16.0, 10.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3066825866699219, -0.29183197021484375, -0.2769813537597656, -0.2621307373046875, -0.24728012084960938, -0.23242950439453125, -0.21757888793945312, -0.202728271484375, -0.18787765502929688, -0.17302703857421875, -0.15817642211914062, -0.1433258056640625, -0.12847518920898438, -0.11362457275390625, -0.09877395629882812, -0.08392333984375, -0.06907272338867188, -0.05422210693359375, -0.039371490478515625, -0.0245208740234375, -0.009670257568359375, 0.00518035888671875, 0.020030975341796875, 0.034881591796875, 0.049732208251953125, 0.06458282470703125, 0.07943344116210938, 0.0942840576171875, 0.10913467407226562, 0.12398529052734375, 0.13883590698242188, 0.1536865234375, 0.16853713989257812, 0.18338775634765625, 0.19823837280273438, 0.2130889892578125, 0.22793960571289062, 0.24279022216796875, 0.2576408386230469, 0.272491455078125, 0.2873420715332031, 0.30219268798828125, 0.3170433044433594, 0.3318939208984375, 0.3467445373535156, 0.36159515380859375, 0.3764457702636719, 0.39129638671875, 0.4061470031738281, 0.42099761962890625, 0.4358482360839844, 0.4506988525390625, 0.4655494689941406, 0.48040008544921875, 0.4952507019042969, 0.510101318359375, 0.5249519348144531, 0.5398025512695312, 0.5546531677246094, 0.5695037841796875, 0.5843544006347656, 0.5992050170898438, 0.6140556335449219, 0.62890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 2.0, 7.0, 10.0, 18.0, 21.0, 44.0, 57.0, 94.0, 142.0, 130.0, 140.0, 107.0, 79.0, 52.0, 29.0, 19.0, 17.0, 5.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.574131965637207, -8.32158088684082, -8.069028854370117, -7.816477298736572, -7.563925743103027, -7.311374187469482, -7.0588226318359375, -6.806271076202393, -6.553719520568848, -6.301167964935303, -6.048616409301758, -5.796064853668213, -5.543513298034668, -5.290961742401123, -5.038410186767578, -4.785858631134033, -4.533307075500488, -4.280755519866943, -4.028203964233398, -3.7756524085998535, -3.5231008529663086, -3.2705492973327637, -3.0179977416992188, -2.765446186065674, -2.512894630432129, -2.260343074798584, -2.007791519165039, -1.7552399635314941, -1.5026884078979492, -1.2501368522644043, -0.9975852966308594, -0.7450337409973145, -0.49248218536376953, -0.2399306297302246, 0.012620925903320312, 0.26517248153686523, 0.5177240371704102, 0.7702755928039551, 1.0228271484375, 1.275378704071045, 1.5279302597045898, 1.7804818153381348, 2.0330333709716797, 2.2855849266052246, 2.5381364822387695, 2.7906880378723145, 3.0432395935058594, 3.2957911491394043, 3.548342704772949, 3.800894260406494, 4.053445816040039, 4.305997371673584, 4.558548927307129, 4.811100482940674, 5.063652038574219, 5.316203594207764, 5.568755149841309, 5.8213067054748535, 6.073858261108398, 6.326409816741943, 6.578961372375488, 6.831512928009033, 7.084064483642578, 7.336616039276123, 7.589167594909668]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 2.0, 8.0, 10.0, 17.0, 11.0, 16.0, 19.0, 25.0, 27.0, 25.0, 32.0, 30.0, 24.0, 34.0, 32.0, 38.0, 54.0, 42.0, 33.0, 50.0, 42.0, 32.0, 48.0, 38.0, 52.0, 36.0, 30.0, 29.0, 18.0, 18.0, 14.0, 16.0, 16.0, 11.0, 13.0, 15.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.057811737060547, -4.880091667175293, -4.702371120452881, -4.524651050567627, -4.346930980682373, -4.169210433959961, -3.991490364074707, -3.813770055770874, -3.636049747467041, -3.458329439163208, -3.280609369277954, -3.102889060974121, -2.925168752670288, -2.747448444366455, -2.569728374481201, -2.392008066177368, -2.2142879962921143, -2.0365676879882812, -1.8588474988937378, -1.6811273097991943, -1.5034070014953613, -1.3256868124008179, -1.1479666233062744, -0.9702463150024414, -0.792526125907898, -0.6148058772087097, -0.43708565831184387, -0.259365439414978, -0.0816451907157898, 0.09607505798339844, 0.2737952470779419, 0.4515155553817749, 0.6292357444763184, 0.8069559931755066, 0.9846762418746948, 1.1623964309692383, 1.3401167392730713, 1.5178369283676147, 1.6955571174621582, 1.8732774257659912, 2.050997734069824, 2.2287180423736572, 2.406438112258911, 2.584158420562744, 2.761878728866577, 2.93959903717041, 3.117319107055664, 3.295039415359497, 3.472759485244751, 3.650479793548584, 3.828199863433838, 4.00592041015625, 4.183640480041504, 4.361360549926758, 4.539080619812012, 4.716801166534424, 4.894521236419678, 5.072241306304932, 5.249961853027344, 5.427681922912598, 5.605401992797852, 5.783122539520264, 5.960842609405518, 6.13856315612793, 6.316283226013184]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 8.0, 19.0, 23.0, 33.0, 54.0, 78.0, 112.0, 211.0, 379.0, 635.0, 1261.0, 3009.0, 11725.0, 112893.0, 3965518.0, 83878.0, 9656.0, 2550.0, 1022.0, 486.0, 304.0, 138.0, 101.0, 52.0, 43.0, 17.0, 16.0, 15.0, 3.0, 4.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.1015625, -3.0059814453125, -2.910400390625, -2.8148193359375, -2.71923828125, -2.6236572265625, -2.528076171875, -2.4324951171875, -2.3369140625, -2.2413330078125, -2.145751953125, -2.0501708984375, -1.95458984375, -1.8590087890625, -1.763427734375, -1.6678466796875, -1.572265625, -1.4766845703125, -1.381103515625, -1.2855224609375, -1.18994140625, -1.0943603515625, -0.998779296875, -0.9031982421875, -0.8076171875, -0.7120361328125, -0.616455078125, -0.5208740234375, -0.42529296875, -0.3297119140625, -0.234130859375, -0.1385498046875, -0.04296875, 0.0526123046875, 0.148193359375, 0.2437744140625, 0.33935546875, 0.4349365234375, 0.530517578125, 0.6260986328125, 0.7216796875, 0.8172607421875, 0.912841796875, 1.0084228515625, 1.10400390625, 1.1995849609375, 1.295166015625, 1.3907470703125, 1.486328125, 1.5819091796875, 1.677490234375, 1.7730712890625, 1.86865234375, 1.9642333984375, 2.059814453125, 2.1553955078125, 2.2509765625, 2.3465576171875, 2.442138671875, 2.5377197265625, 2.63330078125, 2.7288818359375, 2.824462890625, 2.9200439453125, 3.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 11.0, 25.0, 28.0, 45.0, 72.0, 102.0, 112.0, 108.0, 120.0, 96.0, 84.0, 68.0, 40.0, 23.0, 18.0, 12.0, 9.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6087417602539062, -0.5895538330078125, -0.5703659057617188, -0.551177978515625, -0.5319900512695312, -0.5128021240234375, -0.49361419677734375, -0.47442626953125, -0.45523834228515625, -0.4360504150390625, -0.41686248779296875, -0.397674560546875, -0.37848663330078125, -0.3592987060546875, -0.34011077880859375, -0.3209228515625, -0.30173492431640625, -0.2825469970703125, -0.26335906982421875, -0.244171142578125, -0.22498321533203125, -0.2057952880859375, -0.18660736083984375, -0.16741943359375, -0.14823150634765625, -0.1290435791015625, -0.10985565185546875, -0.090667724609375, -0.07147979736328125, -0.0522918701171875, -0.03310394287109375, -0.013916015625, 0.00527191162109375, 0.0244598388671875, 0.04364776611328125, 0.062835693359375, 0.08202362060546875, 0.1012115478515625, 0.12039947509765625, 0.13958740234375, 0.15877532958984375, 0.1779632568359375, 0.19715118408203125, 0.216339111328125, 0.23552703857421875, 0.2547149658203125, 0.27390289306640625, 0.2930908203125, 0.31227874755859375, 0.3314666748046875, 0.35065460205078125, 0.369842529296875, 0.38903045654296875, 0.4082183837890625, 0.42740631103515625, 0.44659423828125, 0.46578216552734375, 0.4849700927734375, 0.5041580200195312, 0.523345947265625, 0.5425338745117188, 0.5617218017578125, 0.5809097290039062, 0.60009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 9.0, 10.0, 9.0, 16.0, 14.0, 22.0, 48.0, 43.0, 70.0, 103.0, 165.0, 274.0, 468.0, 1213.0, 3821.0, 21926.0, 632759.0, 3479291.0, 45092.0, 5833.0, 1652.0, 561.0, 305.0, 152.0, 110.0, 79.0, 53.0, 47.0, 25.0, 30.0, 27.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.041961669921875, -1.96673583984375, -1.891510009765625, -1.8162841796875, -1.741058349609375, -1.66583251953125, -1.590606689453125, -1.515380859375, -1.440155029296875, -1.36492919921875, -1.289703369140625, -1.2144775390625, -1.139251708984375, -1.06402587890625, -0.988800048828125, -0.91357421875, -0.838348388671875, -0.76312255859375, -0.687896728515625, -0.6126708984375, -0.537445068359375, -0.46221923828125, -0.386993408203125, -0.311767578125, -0.236541748046875, -0.16131591796875, -0.086090087890625, -0.0108642578125, 0.064361572265625, 0.13958740234375, 0.214813232421875, 0.2900390625, 0.365264892578125, 0.44049072265625, 0.515716552734375, 0.5909423828125, 0.666168212890625, 0.74139404296875, 0.816619873046875, 0.891845703125, 0.967071533203125, 1.04229736328125, 1.117523193359375, 1.1927490234375, 1.267974853515625, 1.34320068359375, 1.418426513671875, 1.49365234375, 1.568878173828125, 1.64410400390625, 1.719329833984375, 1.7945556640625, 1.869781494140625, 1.94500732421875, 2.020233154296875, 2.095458984375, 2.170684814453125, 2.24591064453125, 2.321136474609375, 2.3963623046875, 2.471588134765625, 2.54681396484375, 2.622039794921875, 2.697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 16.0, 37.0, 101.0, 441.0, 2614.0, 636.0, 134.0, 50.0, 20.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.065948486328125, -1.01666259765625, -0.967376708984375, -0.9180908203125, -0.868804931640625, -0.81951904296875, -0.770233154296875, -0.720947265625, -0.671661376953125, -0.62237548828125, -0.573089599609375, -0.5238037109375, -0.474517822265625, -0.42523193359375, -0.375946044921875, -0.32666015625, -0.277374267578125, -0.22808837890625, -0.178802490234375, -0.1295166015625, -0.080230712890625, -0.03094482421875, 0.018341064453125, 0.067626953125, 0.116912841796875, 0.16619873046875, 0.215484619140625, 0.2647705078125, 0.314056396484375, 0.36334228515625, 0.412628173828125, 0.4619140625, 0.511199951171875, 0.56048583984375, 0.609771728515625, 0.6590576171875, 0.708343505859375, 0.75762939453125, 0.806915283203125, 0.856201171875, 0.905487060546875, 0.95477294921875, 1.004058837890625, 1.0533447265625, 1.102630615234375, 1.15191650390625, 1.201202392578125, 1.25048828125, 1.299774169921875, 1.34906005859375, 1.398345947265625, 1.4476318359375, 1.496917724609375, 1.54620361328125, 1.595489501953125, 1.644775390625, 1.694061279296875, 1.74334716796875, 1.792633056640625, 1.8419189453125, 1.891204833984375, 1.94049072265625, 1.989776611328125, 2.0390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 33.0, 67.0, 154.0, 230.0, 236.0, 139.0, 68.0, 37.0, 14.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.674568176269531, -7.492204666137695, -7.309841156005859, -7.127477645874023, -6.9451141357421875, -6.762750148773193, -6.580386638641357, -6.3980231285095215, -6.2156596183776855, -6.03329610824585, -5.850932598114014, -5.668569087982178, -5.486205101013184, -5.303841590881348, -5.121478080749512, -4.939114570617676, -4.75675106048584, -4.574387550354004, -4.392024040222168, -4.209660530090332, -4.027297019958496, -3.844933271408081, -3.662569522857666, -3.48020601272583, -3.297842502593994, -3.115478992462158, -2.9331154823303223, -2.7507517337799072, -2.5683882236480713, -2.3860247135162354, -2.2036609649658203, -2.0212974548339844, -1.8389344215393066, -1.6565709114074707, -1.4742072820663452, -1.2918436527252197, -1.1094801425933838, -0.9271165728569031, -0.7447530031204224, -0.5623893737792969, -0.38002586364746094, -0.19766229391098022, -0.015298724174499512, 0.1670648455619812, 0.3494284152984619, 0.5317919850349426, 0.7141555547714233, 0.8965191841125488, 1.0788826942443848, 1.2612462043762207, 1.4436098337173462, 1.6259734630584717, 1.8083369731903076, 1.9907004833221436, 2.1730642318725586, 2.3554277420043945, 2.5377912521362305, 2.7201547622680664, 2.9025182723999023, 3.0848820209503174, 3.2672455310821533, 3.4496090412139893, 3.6319727897644043, 3.8143362998962402, 3.996699810028076]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 13.0, 11.0, 21.0, 28.0, 41.0, 42.0, 61.0, 51.0, 71.0, 81.0, 84.0, 84.0, 75.0, 57.0, 54.0, 58.0, 40.0, 33.0, 17.0, 24.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150228977203369, -3.053276538848877, -2.956324338912964, -2.859372138977051, -2.7624197006225586, -2.6654672622680664, -2.5685150623321533, -2.4715628623962402, -2.374610424041748, -2.277657985687256, -2.1807057857513428, -2.0837535858154297, -1.9868011474609375, -1.8898488283157349, -1.7928965091705322, -1.6959441900253296, -1.598991870880127, -1.5020395517349243, -1.4050872325897217, -1.308134913444519, -1.2111825942993164, -1.1142302751541138, -1.0172779560089111, -0.9203256368637085, -0.8233733177185059, -0.7264209985733032, -0.6294686794281006, -0.532516360282898, -0.4355640411376953, -0.3386117219924927, -0.24165940284729004, -0.1447070837020874, -0.047754764556884766, 0.04919755458831787, 0.1461498737335205, 0.24310219287872314, 0.3400545120239258, 0.4370068311691284, 0.533959150314331, 0.6309114694595337, 0.7278637886047363, 0.824816107749939, 0.9217684268951416, 1.0187207460403442, 1.1156730651855469, 1.2126253843307495, 1.3095777034759521, 1.4065300226211548, 1.5034823417663574, 1.60043466091156, 1.6973869800567627, 1.7943392992019653, 1.891291618347168, 1.9882439374923706, 2.0851962566375732, 2.1821484565734863, 2.2791008949279785, 2.3760533332824707, 2.473005533218384, 2.569957733154297, 2.666910171508789, 2.7638626098632812, 2.8608148097991943, 2.9577670097351074, 3.0547194480895996]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 10.0, 11.0, 21.0, 29.0, 39.0, 55.0, 88.0, 155.0, 268.0, 411.0, 830.0, 1600.0, 3588.0, 10924.0, 81771.0, 742213.0, 179336.0, 18080.0, 4742.0, 2061.0, 997.0, 509.0, 271.0, 185.0, 112.0, 81.0, 42.0, 31.0, 20.0, 11.0, 4.0, 9.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.52325439453125, -2.4351806640625, -2.34710693359375, -2.259033203125, -2.17095947265625, -2.0828857421875, -1.99481201171875, -1.90673828125, -1.81866455078125, -1.7305908203125, -1.64251708984375, -1.554443359375, -1.46636962890625, -1.3782958984375, -1.29022216796875, -1.2021484375, -1.11407470703125, -1.0260009765625, -0.93792724609375, -0.849853515625, -0.76177978515625, -0.6737060546875, -0.58563232421875, -0.49755859375, -0.40948486328125, -0.3214111328125, -0.23333740234375, -0.145263671875, -0.05718994140625, 0.0308837890625, 0.11895751953125, 0.20703125, 0.29510498046875, 0.3831787109375, 0.47125244140625, 0.559326171875, 0.64739990234375, 0.7354736328125, 0.82354736328125, 0.91162109375, 0.99969482421875, 1.0877685546875, 1.17584228515625, 1.263916015625, 1.35198974609375, 1.4400634765625, 1.52813720703125, 1.6162109375, 1.70428466796875, 1.7923583984375, 1.88043212890625, 1.968505859375, 2.05657958984375, 2.1446533203125, 2.23272705078125, 2.32080078125, 2.40887451171875, 2.4969482421875, 2.58502197265625, 2.673095703125, 2.76116943359375, 2.8492431640625, 2.93731689453125, 3.025390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 7.0, 11.0, 12.0, 25.0, 36.0, 53.0, 76.0, 104.0, 116.0, 114.0, 113.0, 108.0, 69.0, 59.0, 32.0, 23.0, 16.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66552734375, -0.6450347900390625, -0.624542236328125, -0.6040496826171875, -0.58355712890625, -0.5630645751953125, -0.542572021484375, -0.5220794677734375, -0.5015869140625, -0.4810943603515625, -0.460601806640625, -0.4401092529296875, -0.41961669921875, -0.3991241455078125, -0.378631591796875, -0.3581390380859375, -0.337646484375, -0.3171539306640625, -0.296661376953125, -0.2761688232421875, -0.25567626953125, -0.2351837158203125, -0.214691162109375, -0.1941986083984375, -0.1737060546875, -0.1532135009765625, -0.132720947265625, -0.1122283935546875, -0.09173583984375, -0.0712432861328125, -0.050750732421875, -0.0302581787109375, -0.009765625, 0.0107269287109375, 0.031219482421875, 0.0517120361328125, 0.07220458984375, 0.0926971435546875, 0.113189697265625, 0.1336822509765625, 0.1541748046875, 0.1746673583984375, 0.195159912109375, 0.2156524658203125, 0.23614501953125, 0.2566375732421875, 0.277130126953125, 0.2976226806640625, 0.318115234375, 0.3386077880859375, 0.359100341796875, 0.3795928955078125, 0.40008544921875, 0.4205780029296875, 0.441070556640625, 0.4615631103515625, 0.4820556640625, 0.5025482177734375, 0.523040771484375, 0.5435333251953125, 0.56402587890625, 0.5845184326171875, 0.605010986328125, 0.6255035400390625, 0.64599609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 14.0, 15.0, 24.0, 28.0, 41.0, 68.0, 93.0, 143.0, 212.0, 336.0, 679.0, 1482.0, 3619.0, 10272.0, 37078.0, 153646.0, 496753.0, 258198.0, 60478.0, 16191.0, 5098.0, 1969.0, 873.0, 420.0, 243.0, 175.0, 92.0, 68.0, 49.0, 41.0, 33.0, 21.0, 18.0, 10.0, 8.0, 7.0, 4.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.220703125, -1.1855010986328125, -1.150299072265625, -1.1150970458984375, -1.07989501953125, -1.0446929931640625, -1.009490966796875, -0.9742889404296875, -0.9390869140625, -0.9038848876953125, -0.868682861328125, -0.8334808349609375, -0.79827880859375, -0.7630767822265625, -0.727874755859375, -0.6926727294921875, -0.657470703125, -0.6222686767578125, -0.587066650390625, -0.5518646240234375, -0.51666259765625, -0.4814605712890625, -0.446258544921875, -0.4110565185546875, -0.3758544921875, -0.3406524658203125, -0.305450439453125, -0.2702484130859375, -0.23504638671875, -0.1998443603515625, -0.164642333984375, -0.1294403076171875, -0.09423828125, -0.0590362548828125, -0.023834228515625, 0.0113677978515625, 0.04656982421875, 0.0817718505859375, 0.116973876953125, 0.1521759033203125, 0.1873779296875, 0.2225799560546875, 0.257781982421875, 0.2929840087890625, 0.32818603515625, 0.3633880615234375, 0.398590087890625, 0.4337921142578125, 0.468994140625, 0.5041961669921875, 0.539398193359375, 0.5746002197265625, 0.60980224609375, 0.6450042724609375, 0.680206298828125, 0.7154083251953125, 0.7506103515625, 0.7858123779296875, 0.821014404296875, 0.8562164306640625, 0.89141845703125, 0.9266204833984375, 0.961822509765625, 0.9970245361328125, 1.0322265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 1.0, 9.0, 11.0, 10.0, 19.0, 19.0, 18.0, 29.0, 17.0, 18.0, 36.0, 29.0, 30.0, 37.0, 38.0, 40.0, 52.0, 45.0, 51.0, 36.0, 42.0, 42.0, 46.0, 33.0, 29.0, 32.0, 29.0, 33.0, 19.0, 22.0, 20.0, 17.0, 17.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0], "bins": [-1.1005859375, -1.0685272216796875, -1.036468505859375, -1.0044097900390625, -0.97235107421875, -0.9402923583984375, -0.908233642578125, -0.8761749267578125, -0.8441162109375, -0.8120574951171875, -0.779998779296875, -0.7479400634765625, -0.71588134765625, -0.6838226318359375, -0.651763916015625, -0.6197052001953125, -0.587646484375, -0.5555877685546875, -0.523529052734375, -0.4914703369140625, -0.45941162109375, -0.4273529052734375, -0.395294189453125, -0.3632354736328125, -0.3311767578125, -0.2991180419921875, -0.267059326171875, -0.2350006103515625, -0.20294189453125, -0.1708831787109375, -0.138824462890625, -0.1067657470703125, -0.07470703125, -0.0426483154296875, -0.010589599609375, 0.0214691162109375, 0.05352783203125, 0.0855865478515625, 0.117645263671875, 0.1497039794921875, 0.1817626953125, 0.2138214111328125, 0.245880126953125, 0.2779388427734375, 0.30999755859375, 0.3420562744140625, 0.374114990234375, 0.4061737060546875, 0.438232421875, 0.4702911376953125, 0.502349853515625, 0.5344085693359375, 0.56646728515625, 0.5985260009765625, 0.630584716796875, 0.6626434326171875, 0.6947021484375, 0.7267608642578125, 0.758819580078125, 0.7908782958984375, 0.82293701171875, 0.8549957275390625, 0.887054443359375, 0.9191131591796875, 0.951171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 11.0, 28.0, 23.0, 43.0, 109.0, 227.0, 655.0, 2589.0, 26418.0, 838266.0, 171438.0, 6882.0, 1141.0, 406.0, 125.0, 80.0, 47.0, 20.0, 19.0, 8.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.1595458984375, -1.121826171875, -1.0841064453125, -1.04638671875, -1.0086669921875, -0.970947265625, -0.9332275390625, -0.8955078125, -0.8577880859375, -0.820068359375, -0.7823486328125, -0.74462890625, -0.7069091796875, -0.669189453125, -0.6314697265625, -0.59375, -0.5560302734375, -0.518310546875, -0.4805908203125, -0.44287109375, -0.4051513671875, -0.367431640625, -0.3297119140625, -0.2919921875, -0.2542724609375, -0.216552734375, -0.1788330078125, -0.14111328125, -0.1033935546875, -0.065673828125, -0.0279541015625, 0.009765625, 0.0474853515625, 0.085205078125, 0.1229248046875, 0.16064453125, 0.1983642578125, 0.236083984375, 0.2738037109375, 0.3115234375, 0.3492431640625, 0.386962890625, 0.4246826171875, 0.46240234375, 0.5001220703125, 0.537841796875, 0.5755615234375, 0.61328125, 0.6510009765625, 0.688720703125, 0.7264404296875, 0.76416015625, 0.8018798828125, 0.839599609375, 0.8773193359375, 0.9150390625, 0.9527587890625, 0.990478515625, 1.0281982421875, 1.06591796875, 1.1036376953125, 1.141357421875, 1.1790771484375, 1.216796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 12.0, 11.0, 15.0, 18.0, 22.0, 39.0, 46.0, 67.0, 59.0, 83.0, 91.0, 102.0, 78.0, 66.0, 54.0, 43.0, 31.0, 26.0, 25.0, 14.0, 15.0, 8.0, 20.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.779764175415039e-05, -8.535757660865784e-05, -8.291751146316528e-05, -8.047744631767273e-05, -7.803738117218018e-05, -7.559731602668762e-05, -7.315725088119507e-05, -7.071718573570251e-05, -6.827712059020996e-05, -6.583705544471741e-05, -6.339699029922485e-05, -6.09569251537323e-05, -5.8516860008239746e-05, -5.607679486274719e-05, -5.363672971725464e-05, -5.1196664571762085e-05, -4.875659942626953e-05, -4.631653428077698e-05, -4.3876469135284424e-05, -4.143640398979187e-05, -3.8996338844299316e-05, -3.655627369880676e-05, -3.411620855331421e-05, -3.1676143407821655e-05, -2.92360782623291e-05, -2.6796013116836548e-05, -2.4355947971343994e-05, -2.191588282585144e-05, -1.9475817680358887e-05, -1.7035752534866333e-05, -1.459568738937378e-05, -1.2155622243881226e-05, -9.715557098388672e-06, -7.275491952896118e-06, -4.8354268074035645e-06, -2.3953616619110107e-06, 4.470348358154297e-08, 2.4847686290740967e-06, 4.92483377456665e-06, 7.364898920059204e-06, 9.804964065551758e-06, 1.2245029211044312e-05, 1.4685094356536865e-05, 1.712515950202942e-05, 1.9565224647521973e-05, 2.2005289793014526e-05, 2.444535493850708e-05, 2.6885420083999634e-05, 2.9325485229492188e-05, 3.176555037498474e-05, 3.4205615520477295e-05, 3.664568066596985e-05, 3.90857458114624e-05, 4.1525810956954956e-05, 4.396587610244751e-05, 4.6405941247940063e-05, 4.884600639343262e-05, 5.128607153892517e-05, 5.3726136684417725e-05, 5.616620182991028e-05, 5.860626697540283e-05, 6.104633212089539e-05, 6.348639726638794e-05, 6.592646241188049e-05, 6.836652755737305e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 15.0, 20.0, 34.0, 64.0, 82.0, 149.0, 443.0, 2122.0, 37973.0, 971714.0, 33079.0, 2016.0, 456.0, 159.0, 89.0, 53.0, 30.0, 16.0, 12.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.01171875, -1.9607696533203125, -1.909820556640625, -1.8588714599609375, -1.80792236328125, -1.7569732666015625, -1.706024169921875, -1.6550750732421875, -1.6041259765625, -1.5531768798828125, -1.502227783203125, -1.4512786865234375, -1.40032958984375, -1.3493804931640625, -1.298431396484375, -1.2474822998046875, -1.196533203125, -1.1455841064453125, -1.094635009765625, -1.0436859130859375, -0.99273681640625, -0.9417877197265625, -0.890838623046875, -0.8398895263671875, -0.7889404296875, -0.7379913330078125, -0.687042236328125, -0.6360931396484375, -0.58514404296875, -0.5341949462890625, -0.483245849609375, -0.4322967529296875, -0.38134765625, -0.3303985595703125, -0.279449462890625, -0.2285003662109375, -0.17755126953125, -0.1266021728515625, -0.075653076171875, -0.0247039794921875, 0.0262451171875, 0.0771942138671875, 0.128143310546875, 0.1790924072265625, 0.23004150390625, 0.2809906005859375, 0.331939697265625, 0.3828887939453125, 0.433837890625, 0.4847869873046875, 0.535736083984375, 0.5866851806640625, 0.63763427734375, 0.6885833740234375, 0.739532470703125, 0.7904815673828125, 0.8414306640625, 0.8923797607421875, 0.943328857421875, 0.9942779541015625, 1.04522705078125, 1.0961761474609375, 1.147125244140625, 1.1980743408203125, 1.2490234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 10.0, 15.0, 16.0, 21.0, 23.0, 34.0, 41.0, 49.0, 51.0, 95.0, 97.0, 99.0, 75.0, 82.0, 57.0, 53.0, 40.0, 28.0, 24.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.426513671875, -0.4127540588378906, -0.39899444580078125, -0.3852348327636719, -0.3714752197265625, -0.3577156066894531, -0.34395599365234375, -0.3301963806152344, -0.316436767578125, -0.3026771545410156, -0.28891754150390625, -0.2751579284667969, -0.2613983154296875, -0.24763870239257812, -0.23387908935546875, -0.22011947631835938, -0.20635986328125, -0.19260025024414062, -0.17884063720703125, -0.16508102416992188, -0.1513214111328125, -0.13756179809570312, -0.12380218505859375, -0.11004257202148438, -0.096282958984375, -0.08252334594726562, -0.06876373291015625, -0.055004119873046875, -0.0412445068359375, -0.027484893798828125, -0.01372528076171875, 3.4332275390625e-05, 0.0137939453125, 0.027553558349609375, 0.04131317138671875, 0.055072784423828125, 0.0688323974609375, 0.08259201049804688, 0.09635162353515625, 0.11011123657226562, 0.123870849609375, 0.13763046264648438, 0.15139007568359375, 0.16514968872070312, 0.1789093017578125, 0.19266891479492188, 0.20642852783203125, 0.22018814086914062, 0.23394775390625, 0.24770736694335938, 0.26146697998046875, 0.2752265930175781, 0.2889862060546875, 0.3027458190917969, 0.31650543212890625, 0.3302650451660156, 0.344024658203125, 0.3577842712402344, 0.37154388427734375, 0.3853034973144531, 0.3990631103515625, 0.4128227233886719, 0.42658233642578125, 0.4403419494628906, 0.4541015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 22.0, 34.0, 157.0, 353.0, 299.0, 110.0, 22.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.736228942871094, -27.10340690612793, -26.470584869384766, -25.83776092529297, -25.204938888549805, -24.57211685180664, -23.939294815063477, -23.306472778320312, -22.67365074157715, -22.040828704833984, -21.40800666809082, -20.775184631347656, -20.14236068725586, -19.509538650512695, -18.87671661376953, -18.243894577026367, -17.611072540283203, -16.97825050354004, -16.345428466796875, -15.712605476379395, -15.07978343963623, -14.44696044921875, -13.814138412475586, -13.181316375732422, -12.548492431640625, -11.915670394897461, -11.28284740447998, -10.650025367736816, -10.017203330993652, -9.384380340576172, -8.751558303833008, -8.118736267089844, -7.48591423034668, -6.853091716766357, -6.220269680023193, -5.587447166442871, -4.954625129699707, -4.321802616119385, -3.6889801025390625, -3.0561580657958984, -2.423335552215576, -1.790513277053833, -1.1576908826828003, -0.5248684883117676, 0.10795378684997559, 0.7407760620117188, 1.373598575592041, 2.006420612335205, 2.6392431259155273, 3.2720654010772705, 3.9048876762390137, 4.537710189819336, 5.1705322265625, 5.803354740142822, 6.4361772537231445, 7.068999290466309, 7.701821804046631, 8.334644317626953, 8.967466354370117, 9.600288391113281, 10.233111381530762, 10.865933418273926, 11.498756408691406, 12.13157844543457, 12.764400482177734]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 7.0, 9.0, 13.0, 10.0, 15.0, 15.0, 21.0, 20.0, 25.0, 23.0, 32.0, 40.0, 21.0, 39.0, 48.0, 56.0, 46.0, 55.0, 38.0, 45.0, 38.0, 47.0, 45.0, 37.0, 47.0, 26.0, 25.0, 23.0, 19.0, 23.0, 10.0, 11.0, 12.0, 8.0, 13.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.246608734130859, -5.0803542137146, -4.914100170135498, -4.747845649719238, -4.581591606140137, -4.415337085723877, -4.249083042144775, -4.082828521728516, -3.916574478149414, -3.7503201961517334, -3.5840659141540527, -3.417811632156372, -3.2515573501586914, -3.0853030681610107, -2.91904878616333, -2.7527942657470703, -2.5865399837493896, -2.420285701751709, -2.2540314197540283, -2.0877771377563477, -1.921522855758667, -1.7552685737609863, -1.5890141725540161, -1.4227598905563354, -1.2565056085586548, -1.0902513265609741, -0.9239970445632935, -0.757742702960968, -0.5914884209632874, -0.4252341389656067, -0.25897979736328125, -0.09272551536560059, 0.07352876663208008, 0.23978306353092194, 0.4060373604297638, 0.5722916722297668, 0.7385459542274475, 0.9048002362251282, 1.0710545778274536, 1.2373088598251343, 1.403563141822815, 1.5698174238204956, 1.7360717058181763, 1.9023261070251465, 2.068580389022827, 2.234834671020508, 2.4010889530181885, 2.567343235015869, 2.73359751701355, 2.8998517990112305, 3.066106081008911, 3.232360363006592, 3.3986146450042725, 3.564868927001953, 3.731123447418213, 3.8973774909973145, 4.063632011413574, 4.229886531829834, 4.3961405754089355, 4.562395095825195, 4.728649139404297, 4.894903659820557, 5.061157703399658, 5.227412223815918, 5.3936662673950195]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 20.0, 24.0, 32.0, 36.0, 54.0, 83.0, 118.0, 172.0, 266.0, 470.0, 803.0, 1684.0, 4405.0, 17388.0, 228431.0, 3874682.0, 51682.0, 8546.0, 2766.0, 1159.0, 554.0, 311.0, 162.0, 137.0, 78.0, 58.0, 37.0, 29.0, 13.0, 10.0, 17.0, 5.0, 10.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.876953125, -2.79974365234375, -2.7225341796875, -2.64532470703125, -2.568115234375, -2.49090576171875, -2.4136962890625, -2.33648681640625, -2.25927734375, -2.18206787109375, -2.1048583984375, -2.02764892578125, -1.950439453125, -1.87322998046875, -1.7960205078125, -1.71881103515625, -1.6416015625, -1.56439208984375, -1.4871826171875, -1.40997314453125, -1.332763671875, -1.25555419921875, -1.1783447265625, -1.10113525390625, -1.02392578125, -0.94671630859375, -0.8695068359375, -0.79229736328125, -0.715087890625, -0.63787841796875, -0.5606689453125, -0.48345947265625, -0.40625, -0.32904052734375, -0.2518310546875, -0.17462158203125, -0.097412109375, -0.02020263671875, 0.0570068359375, 0.13421630859375, 0.21142578125, 0.28863525390625, 0.3658447265625, 0.44305419921875, 0.520263671875, 0.59747314453125, 0.6746826171875, 0.75189208984375, 0.8291015625, 0.90631103515625, 0.9835205078125, 1.06072998046875, 1.137939453125, 1.21514892578125, 1.2923583984375, 1.36956787109375, 1.44677734375, 1.52398681640625, 1.6011962890625, 1.67840576171875, 1.755615234375, 1.83282470703125, 1.9100341796875, 1.98724365234375, 2.064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 20.0, 37.0, 52.0, 82.0, 100.0, 98.0, 144.0, 94.0, 94.0, 91.0, 55.0, 38.0, 27.0, 17.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6387786865234375, -0.617889404296875, -0.5970001220703125, -0.57611083984375, -0.5552215576171875, -0.534332275390625, -0.5134429931640625, -0.4925537109375, -0.4716644287109375, -0.450775146484375, -0.4298858642578125, -0.40899658203125, -0.3881072998046875, -0.367218017578125, -0.3463287353515625, -0.325439453125, -0.3045501708984375, -0.283660888671875, -0.2627716064453125, -0.24188232421875, -0.2209930419921875, -0.200103759765625, -0.1792144775390625, -0.1583251953125, -0.1374359130859375, -0.116546630859375, -0.0956573486328125, -0.07476806640625, -0.0538787841796875, -0.032989501953125, -0.0121002197265625, 0.0087890625, 0.0296783447265625, 0.050567626953125, 0.0714569091796875, 0.09234619140625, 0.1132354736328125, 0.134124755859375, 0.1550140380859375, 0.1759033203125, 0.1967926025390625, 0.217681884765625, 0.2385711669921875, 0.25946044921875, 0.2803497314453125, 0.301239013671875, 0.3221282958984375, 0.343017578125, 0.3639068603515625, 0.384796142578125, 0.4056854248046875, 0.42657470703125, 0.4474639892578125, 0.468353271484375, 0.4892425537109375, 0.5101318359375, 0.5310211181640625, 0.551910400390625, 0.5727996826171875, 0.59368896484375, 0.6145782470703125, 0.635467529296875, 0.6563568115234375, 0.67724609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 9.0, 8.0, 17.0, 11.0, 27.0, 33.0, 62.0, 90.0, 108.0, 146.0, 257.0, 566.0, 1191.0, 2939.0, 9417.0, 46859.0, 3058069.0, 1022895.0, 38110.0, 8431.0, 2663.0, 1062.0, 533.0, 290.0, 156.0, 97.0, 71.0, 44.0, 32.0, 23.0, 15.0, 3.0, 9.0, 10.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.34375, -2.2835693359375, -2.223388671875, -2.1632080078125, -2.10302734375, -2.0428466796875, -1.982666015625, -1.9224853515625, -1.8623046875, -1.8021240234375, -1.741943359375, -1.6817626953125, -1.62158203125, -1.5614013671875, -1.501220703125, -1.4410400390625, -1.380859375, -1.3206787109375, -1.260498046875, -1.2003173828125, -1.14013671875, -1.0799560546875, -1.019775390625, -0.9595947265625, -0.8994140625, -0.8392333984375, -0.779052734375, -0.7188720703125, -0.65869140625, -0.5985107421875, -0.538330078125, -0.4781494140625, -0.41796875, -0.3577880859375, -0.297607421875, -0.2374267578125, -0.17724609375, -0.1170654296875, -0.056884765625, 0.0032958984375, 0.0634765625, 0.1236572265625, 0.183837890625, 0.2440185546875, 0.30419921875, 0.3643798828125, 0.424560546875, 0.4847412109375, 0.544921875, 0.6051025390625, 0.665283203125, 0.7254638671875, 0.78564453125, 0.8458251953125, 0.906005859375, 0.9661865234375, 1.0263671875, 1.0865478515625, 1.146728515625, 1.2069091796875, 1.26708984375, 1.3272705078125, 1.387451171875, 1.4476318359375, 1.5078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 13.0, 7.0, 29.0, 51.0, 106.0, 353.0, 2512.0, 699.0, 141.0, 69.0, 32.0, 21.0, 16.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2874984741210938, -1.2566375732421875, -1.2257766723632812, -1.194915771484375, -1.1640548706054688, -1.1331939697265625, -1.1023330688476562, -1.07147216796875, -1.0406112670898438, -1.0097503662109375, -0.9788894653320312, -0.948028564453125, -0.9171676635742188, -0.8863067626953125, -0.8554458618164062, -0.8245849609375, -0.7937240600585938, -0.7628631591796875, -0.7320022583007812, -0.701141357421875, -0.6702804565429688, -0.6394195556640625, -0.6085586547851562, -0.57769775390625, -0.5468368530273438, -0.5159759521484375, -0.48511505126953125, -0.454254150390625, -0.42339324951171875, -0.3925323486328125, -0.36167144775390625, -0.330810546875, -0.29994964599609375, -0.2690887451171875, -0.23822784423828125, -0.207366943359375, -0.17650604248046875, -0.1456451416015625, -0.11478424072265625, -0.08392333984375, -0.05306243896484375, -0.0222015380859375, 0.00865936279296875, 0.039520263671875, 0.07038116455078125, 0.1012420654296875, 0.13210296630859375, 0.1629638671875, 0.19382476806640625, 0.2246856689453125, 0.25554656982421875, 0.286407470703125, 0.31726837158203125, 0.3481292724609375, 0.37899017333984375, 0.40985107421875, 0.44071197509765625, 0.4715728759765625, 0.5024337768554688, 0.533294677734375, 0.5641555786132812, 0.5950164794921875, 0.6258773803710938, 0.65673828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 3.0, 10.0, 21.0, 30.0, 70.0, 102.0, 160.0, 212.0, 165.0, 108.0, 55.0, 29.0, 15.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6022846698760986, -3.4805939197540283, -3.358903169631958, -3.2372124195098877, -3.1155216693878174, -2.993830919265747, -2.872140407562256, -2.7504496574401855, -2.6287589073181152, -2.507068157196045, -2.3853774070739746, -2.2636866569519043, -2.141995906829834, -2.0203051567077637, -1.898614525794983, -1.7769237756729126, -1.6552329063415527, -1.5335421562194824, -1.411851406097412, -1.2901606559753418, -1.1684699058532715, -1.0467791557312012, -0.9250885248184204, -0.8033977746963501, -0.6817070245742798, -0.5600162744522095, -0.43832555413246155, -0.3166348338127136, -0.1949440836906433, -0.073253333568573, 0.04843735694885254, 0.17012810707092285, 0.29181909561157227, 0.4135098457336426, 0.5352005958557129, 0.6568912863731384, 0.7785820364952087, 0.900272786617279, 1.0219634771347046, 1.143654227256775, 1.2653449773788452, 1.3870357275009155, 1.5087264776229858, 1.6304171085357666, 1.752107858657837, 1.8737986087799072, 1.9954893589019775, 2.117180109024048, 2.238870859146118, 2.3605616092681885, 2.482252359390259, 2.603943109512329, 2.7256338596343994, 2.8473246097564697, 2.969015121459961, 3.0907058715820312, 3.2123966217041016, 3.334087371826172, 3.455778121948242, 3.5774688720703125, 3.699159622192383, 3.820850372314453, 3.9425411224365234, 4.064231872558594, 4.185922622680664]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 13.0, 18.0, 14.0, 27.0, 42.0, 27.0, 52.0, 55.0, 53.0, 54.0, 68.0, 69.0, 73.0, 58.0, 76.0, 50.0, 49.0, 40.0, 37.0, 33.0, 15.0, 18.0, 13.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4217028617858887, -2.3500778675079346, -2.2784526348114014, -2.2068276405334473, -2.135202646255493, -2.063577651977539, -1.9919524192810059, -1.9203274250030518, -1.848702311515808, -1.7770771980285645, -1.7054522037506104, -1.6338270902633667, -1.562201976776123, -1.490576982498169, -1.4189518690109253, -1.3473267555236816, -1.2757017612457275, -1.2040766477584839, -1.1324516534805298, -1.0608265399932861, -0.9892014861106873, -0.9175764322280884, -0.8459513187408447, -0.7743262648582458, -0.702701210975647, -0.6310761570930481, -0.5594511032104492, -0.48782598972320557, -0.4162009358406067, -0.3445758819580078, -0.27295079827308655, -0.20132571458816528, -0.1297008991241455, -0.05807583034038544, 0.013549238443374634, 0.0851743072271347, 0.15679937601089478, 0.22842442989349365, 0.3000495135784149, 0.3716745972633362, 0.44329965114593506, 0.5149247050285339, 0.5865497589111328, 0.6581748723983765, 0.7297999262809753, 0.8014249801635742, 0.8730500936508179, 0.9446751475334167, 1.0163002014160156, 1.0879253149032593, 1.1595503091812134, 1.231175422668457, 1.3028004169464111, 1.3744255304336548, 1.4460506439208984, 1.5176756381988525, 1.5893007516860962, 1.6609258651733398, 1.732550859451294, 1.8041759729385376, 1.8758010864257812, 1.9474260807037354, 2.0190510749816895, 2.0906763076782227, 2.1623013019561768]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 15.0, 27.0, 64.0, 109.0, 203.0, 468.0, 961.0, 2392.0, 9452.0, 153239.0, 830390.0, 43063.0, 5102.0, 1638.0, 729.0, 337.0, 157.0, 102.0, 29.0, 31.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.390625, -4.26971435546875, -4.1488037109375, -4.02789306640625, -3.906982421875, -3.78607177734375, -3.6651611328125, -3.54425048828125, -3.42333984375, -3.30242919921875, -3.1815185546875, -3.06060791015625, -2.939697265625, -2.81878662109375, -2.6978759765625, -2.57696533203125, -2.4560546875, -2.33514404296875, -2.2142333984375, -2.09332275390625, -1.972412109375, -1.85150146484375, -1.7305908203125, -1.60968017578125, -1.48876953125, -1.36785888671875, -1.2469482421875, -1.12603759765625, -1.005126953125, -0.88421630859375, -0.7633056640625, -0.64239501953125, -0.521484375, -0.40057373046875, -0.2796630859375, -0.15875244140625, -0.037841796875, 0.08306884765625, 0.2039794921875, 0.32489013671875, 0.44580078125, 0.56671142578125, 0.6876220703125, 0.80853271484375, 0.929443359375, 1.05035400390625, 1.1712646484375, 1.29217529296875, 1.4130859375, 1.53399658203125, 1.6549072265625, 1.77581787109375, 1.896728515625, 2.01763916015625, 2.1385498046875, 2.25946044921875, 2.38037109375, 2.50128173828125, 2.6221923828125, 2.74310302734375, 2.864013671875, 2.98492431640625, 3.1058349609375, 3.22674560546875, 3.34765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 16.0, 21.0, 31.0, 70.0, 84.0, 109.0, 113.0, 135.0, 118.0, 86.0, 65.0, 52.0, 45.0, 16.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6797256469726562, -0.6573028564453125, -0.6348800659179688, -0.612457275390625, -0.5900344848632812, -0.5676116943359375, -0.5451889038085938, -0.52276611328125, -0.5003433227539062, -0.4779205322265625, -0.45549774169921875, -0.433074951171875, -0.41065216064453125, -0.3882293701171875, -0.36580657958984375, -0.3433837890625, -0.32096099853515625, -0.2985382080078125, -0.27611541748046875, -0.253692626953125, -0.23126983642578125, -0.2088470458984375, -0.18642425537109375, -0.16400146484375, -0.14157867431640625, -0.1191558837890625, -0.09673309326171875, -0.074310302734375, -0.05188751220703125, -0.0294647216796875, -0.00704193115234375, 0.015380859375, 0.03780364990234375, 0.0602264404296875, 0.08264923095703125, 0.105072021484375, 0.12749481201171875, 0.1499176025390625, 0.17234039306640625, 0.19476318359375, 0.21718597412109375, 0.2396087646484375, 0.26203155517578125, 0.284454345703125, 0.30687713623046875, 0.3292999267578125, 0.35172271728515625, 0.3741455078125, 0.39656829833984375, 0.4189910888671875, 0.44141387939453125, 0.463836669921875, 0.48625946044921875, 0.5086822509765625, 0.5311050415039062, 0.55352783203125, 0.5759506225585938, 0.5983734130859375, 0.6207962036132812, 0.643218994140625, 0.6656417846679688, 0.6880645751953125, 0.7104873657226562, 0.73291015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 7.0, 3.0, 11.0, 17.0, 19.0, 21.0, 16.0, 33.0, 36.0, 65.0, 90.0, 92.0, 141.0, 225.0, 404.0, 670.0, 1503.0, 3169.0, 7527.0, 21030.0, 60498.0, 174017.0, 392050.0, 248701.0, 88130.0, 30667.0, 11111.0, 4252.0, 1885.0, 812.0, 493.0, 254.0, 153.0, 114.0, 70.0, 60.0, 55.0, 31.0, 24.0, 24.0, 21.0, 16.0, 8.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.912109375, -0.8865432739257812, -0.8609771728515625, -0.8354110717773438, -0.809844970703125, -0.7842788696289062, -0.7587127685546875, -0.7331466674804688, -0.70758056640625, -0.6820144653320312, -0.6564483642578125, -0.6308822631835938, -0.605316162109375, -0.5797500610351562, -0.5541839599609375, -0.5286178588867188, -0.5030517578125, -0.47748565673828125, -0.4519195556640625, -0.42635345458984375, -0.400787353515625, -0.37522125244140625, -0.3496551513671875, -0.32408905029296875, -0.29852294921875, -0.27295684814453125, -0.2473907470703125, -0.22182464599609375, -0.196258544921875, -0.17069244384765625, -0.1451263427734375, -0.11956024169921875, -0.093994140625, -0.06842803955078125, -0.0428619384765625, -0.01729583740234375, 0.008270263671875, 0.03383636474609375, 0.0594024658203125, 0.08496856689453125, 0.11053466796875, 0.13610076904296875, 0.1616668701171875, 0.18723297119140625, 0.212799072265625, 0.23836517333984375, 0.2639312744140625, 0.28949737548828125, 0.3150634765625, 0.34062957763671875, 0.3661956787109375, 0.39176177978515625, 0.417327880859375, 0.44289398193359375, 0.4684600830078125, 0.49402618408203125, 0.51959228515625, 0.5451583862304688, 0.5707244873046875, 0.5962905883789062, 0.621856689453125, 0.6474227905273438, 0.6729888916015625, 0.6985549926757812, 0.72412109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 8.0, 12.0, 16.0, 14.0, 19.0, 18.0, 18.0, 36.0, 38.0, 35.0, 43.0, 30.0, 38.0, 36.0, 41.0, 50.0, 41.0, 35.0, 45.0, 43.0, 45.0, 34.0, 37.0, 21.0, 30.0, 26.0, 32.0, 21.0, 16.0, 19.0, 10.0, 18.0, 7.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.9775390625, -0.9475173950195312, -0.9174957275390625, -0.8874740600585938, -0.857452392578125, -0.8274307250976562, -0.7974090576171875, -0.7673873901367188, -0.73736572265625, -0.7073440551757812, -0.6773223876953125, -0.6473007202148438, -0.617279052734375, -0.5872573852539062, -0.5572357177734375, -0.5272140502929688, -0.4971923828125, -0.46717071533203125, -0.4371490478515625, -0.40712738037109375, -0.377105712890625, -0.34708404541015625, -0.3170623779296875, -0.28704071044921875, -0.25701904296875, -0.22699737548828125, -0.1969757080078125, -0.16695404052734375, -0.136932373046875, -0.10691070556640625, -0.0768890380859375, -0.04686737060546875, -0.016845703125, 0.01317596435546875, 0.0431976318359375, 0.07321929931640625, 0.103240966796875, 0.13326263427734375, 0.1632843017578125, 0.19330596923828125, 0.22332763671875, 0.25334930419921875, 0.2833709716796875, 0.31339263916015625, 0.343414306640625, 0.37343597412109375, 0.4034576416015625, 0.43347930908203125, 0.4635009765625, 0.49352264404296875, 0.5235443115234375, 0.5535659790039062, 0.583587646484375, 0.6136093139648438, 0.6436309814453125, 0.6736526489257812, 0.70367431640625, 0.7336959838867188, 0.7637176513671875, 0.7937393188476562, 0.823760986328125, 0.8537826538085938, 0.8838043212890625, 0.9138259887695312, 0.94384765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 17.0, 19.0, 31.0, 33.0, 64.0, 84.0, 126.0, 181.0, 267.0, 475.0, 839.0, 1862.0, 5082.0, 18995.0, 104653.0, 486940.0, 347572.0, 61980.0, 12310.0, 3619.0, 1535.0, 683.0, 415.0, 259.0, 142.0, 101.0, 64.0, 51.0, 38.0, 18.0, 23.0, 13.0, 10.0, 4.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390869140625, -0.3773231506347656, -0.36377716064453125, -0.3502311706542969, -0.3366851806640625, -0.3231391906738281, -0.30959320068359375, -0.2960472106933594, -0.282501220703125, -0.2689552307128906, -0.25540924072265625, -0.24186325073242188, -0.2283172607421875, -0.21477127075195312, -0.20122528076171875, -0.18767929077148438, -0.17413330078125, -0.16058731079101562, -0.14704132080078125, -0.13349533081054688, -0.1199493408203125, -0.10640335083007812, -0.09285736083984375, -0.07931137084960938, -0.065765380859375, -0.052219390869140625, -0.03867340087890625, -0.025127410888671875, -0.0115814208984375, 0.001964569091796875, 0.01551055908203125, 0.029056549072265625, 0.0426025390625, 0.056148529052734375, 0.06969451904296875, 0.08324050903320312, 0.0967864990234375, 0.11033248901367188, 0.12387847900390625, 0.13742446899414062, 0.150970458984375, 0.16451644897460938, 0.17806243896484375, 0.19160842895507812, 0.2051544189453125, 0.21870040893554688, 0.23224639892578125, 0.24579238891601562, 0.25933837890625, 0.2728843688964844, 0.28643035888671875, 0.2999763488769531, 0.3135223388671875, 0.3270683288574219, 0.34061431884765625, 0.3541603088378906, 0.367706298828125, 0.3812522888183594, 0.39479827880859375, 0.4083442687988281, 0.4218902587890625, 0.4354362487792969, 0.44898223876953125, 0.4625282287597656, 0.47607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 12.0, 15.0, 23.0, 19.0, 22.0, 53.0, 42.0, 56.0, 77.0, 97.0, 83.0, 93.0, 80.0, 69.0, 60.0, 49.0, 35.0, 26.0, 15.0, 16.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.367134094238281e-05, -7.12154433131218e-05, -6.875954568386078e-05, -6.630364805459976e-05, -6.384775042533875e-05, -6.139185279607773e-05, -5.893595516681671e-05, -5.6480057537555695e-05, -5.402415990829468e-05, -5.156826227903366e-05, -4.9112364649772644e-05, -4.665646702051163e-05, -4.420056939125061e-05, -4.1744671761989594e-05, -3.928877413272858e-05, -3.683287650346756e-05, -3.437697887420654e-05, -3.1921081244945526e-05, -2.946518361568451e-05, -2.7009285986423492e-05, -2.4553388357162476e-05, -2.209749072790146e-05, -1.9641593098640442e-05, -1.7185695469379425e-05, -1.4729797840118408e-05, -1.2273900210857391e-05, -9.818002581596375e-06, -7.362104952335358e-06, -4.906207323074341e-06, -2.450309693813324e-06, 5.587935447692871e-09, 2.4614855647087097e-06, 4.9173831939697266e-06, 7.373280823230743e-06, 9.82917845249176e-06, 1.2285076081752777e-05, 1.4740973711013794e-05, 1.719687134027481e-05, 1.9652768969535828e-05, 2.2108666598796844e-05, 2.456456422805786e-05, 2.7020461857318878e-05, 2.9476359486579895e-05, 3.193225711584091e-05, 3.438815474510193e-05, 3.6844052374362946e-05, 3.929995000362396e-05, 4.175584763288498e-05, 4.4211745262145996e-05, 4.666764289140701e-05, 4.912354052066803e-05, 5.157943814992905e-05, 5.4035335779190063e-05, 5.649123340845108e-05, 5.89471310377121e-05, 6.140302866697311e-05, 6.385892629623413e-05, 6.631482392549515e-05, 6.877072155475616e-05, 7.122661918401718e-05, 7.36825168132782e-05, 7.613841444253922e-05, 7.859431207180023e-05, 8.105020970106125e-05, 8.350610733032227e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 17.0, 26.0, 51.0, 74.0, 108.0, 206.0, 422.0, 885.0, 2104.0, 6383.0, 31648.0, 257637.0, 625006.0, 102358.0, 14954.0, 3862.0, 1447.0, 640.0, 296.0, 156.0, 96.0, 57.0, 30.0, 23.0, 10.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4482421875, -0.43181610107421875, -0.4153900146484375, -0.39896392822265625, -0.382537841796875, -0.36611175537109375, -0.3496856689453125, -0.33325958251953125, -0.31683349609375, -0.30040740966796875, -0.2839813232421875, -0.26755523681640625, -0.251129150390625, -0.23470306396484375, -0.2182769775390625, -0.20185089111328125, -0.1854248046875, -0.16899871826171875, -0.1525726318359375, -0.13614654541015625, -0.119720458984375, -0.10329437255859375, -0.0868682861328125, -0.07044219970703125, -0.05401611328125, -0.03759002685546875, -0.0211639404296875, -0.00473785400390625, 0.011688232421875, 0.02811431884765625, 0.0445404052734375, 0.06096649169921875, 0.077392578125, 0.09381866455078125, 0.1102447509765625, 0.12667083740234375, 0.143096923828125, 0.15952301025390625, 0.1759490966796875, 0.19237518310546875, 0.20880126953125, 0.22522735595703125, 0.2416534423828125, 0.25807952880859375, 0.274505615234375, 0.29093170166015625, 0.3073577880859375, 0.32378387451171875, 0.3402099609375, 0.35663604736328125, 0.3730621337890625, 0.38948822021484375, 0.405914306640625, 0.42234039306640625, 0.4387664794921875, 0.45519256591796875, 0.47161865234375, 0.48804473876953125, 0.5044708251953125, 0.5208969116210938, 0.537322998046875, 0.5537490844726562, 0.5701751708984375, 0.5866012573242188, 0.60302734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 17.0, 14.0, 22.0, 27.0, 29.0, 41.0, 45.0, 56.0, 81.0, 84.0, 75.0, 87.0, 80.0, 80.0, 52.0, 48.0, 34.0, 23.0, 23.0, 15.0, 17.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37548828125, -0.36331939697265625, -0.3511505126953125, -0.33898162841796875, -0.326812744140625, -0.31464385986328125, -0.3024749755859375, -0.29030609130859375, -0.27813720703125, -0.26596832275390625, -0.2537994384765625, -0.24163055419921875, -0.229461669921875, -0.21729278564453125, -0.2051239013671875, -0.19295501708984375, -0.1807861328125, -0.16861724853515625, -0.1564483642578125, -0.14427947998046875, -0.132110595703125, -0.11994171142578125, -0.1077728271484375, -0.09560394287109375, -0.08343505859375, -0.07126617431640625, -0.0590972900390625, -0.04692840576171875, -0.034759521484375, -0.02259063720703125, -0.0104217529296875, 0.00174713134765625, 0.013916015625, 0.02608489990234375, 0.0382537841796875, 0.05042266845703125, 0.062591552734375, 0.07476043701171875, 0.0869293212890625, 0.09909820556640625, 0.11126708984375, 0.12343597412109375, 0.1356048583984375, 0.14777374267578125, 0.159942626953125, 0.17211151123046875, 0.1842803955078125, 0.19644927978515625, 0.2086181640625, 0.22078704833984375, 0.2329559326171875, 0.24512481689453125, 0.257293701171875, 0.26946258544921875, 0.2816314697265625, 0.29380035400390625, 0.30596923828125, 0.31813812255859375, 0.3303070068359375, 0.34247589111328125, 0.354644775390625, 0.36681365966796875, 0.3789825439453125, 0.39115142822265625, 0.4033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 14.0, 13.0, 15.0, 31.0, 33.0, 51.0, 51.0, 92.0, 105.0, 117.0, 94.0, 97.0, 81.0, 67.0, 46.0, 35.0, 28.0, 11.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.698837280273438, -8.522096633911133, -8.345356941223145, -8.16861629486084, -7.991876602172852, -7.815136432647705, -7.638396263122559, -7.461655616760254, -7.284915924072266, -7.108175754547119, -6.931435585021973, -6.754695415496826, -6.57795524597168, -6.401215076446533, -6.224474906921387, -6.047734260559082, -5.8709940910339355, -5.694253921508789, -5.517513751983643, -5.340773582458496, -5.16403341293335, -4.987293243408203, -4.810552597045898, -4.63381290435791, -4.4570722579956055, -4.280332088470459, -4.1035919189453125, -3.926851749420166, -3.7501115798950195, -3.573371410369873, -3.3966310024261475, -3.219890832901001, -3.0431504249572754, -2.866410255432129, -2.6896700859069824, -2.512929916381836, -2.3361897468566895, -2.159449577331543, -1.9827091693878174, -1.805968999862671, -1.6292288303375244, -1.452488660812378, -1.2757484912872314, -1.0990082025527954, -0.9222680330276489, -0.7455278635025024, -0.5687875747680664, -0.3920474052429199, -0.21530723571777344, -0.038567036390304565, 0.1381731629371643, 0.31491339206695557, 0.49165356159210205, 0.6683937311172485, 0.8451340198516846, 1.021874189376831, 1.1986143589019775, 1.375354528427124, 1.5520946979522705, 1.7288349866867065, 1.905575156211853, 2.082315444946289, 2.2590556144714355, 2.435795783996582, 2.6125359535217285]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 16.0, 12.0, 13.0, 24.0, 26.0, 16.0, 23.0, 38.0, 24.0, 30.0, 42.0, 32.0, 48.0, 41.0, 45.0, 56.0, 49.0, 44.0, 34.0, 44.0, 37.0, 42.0, 36.0, 30.0, 21.0, 21.0, 25.0, 18.0, 15.0, 10.0, 15.0, 15.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.717818260192871, -5.5656938552856445, -5.413569450378418, -5.261444568634033, -5.109320163726807, -4.95719575881958, -4.805070877075195, -4.652946472167969, -4.500822067260742, -4.348697662353516, -4.196573257446289, -4.044448375701904, -3.8923239707946777, -3.740199565887451, -3.5880749225616455, -3.43595027923584, -3.2838258743286133, -3.1317014694213867, -2.979576826095581, -2.8274521827697754, -2.675327777862549, -2.5232033729553223, -2.3710787296295166, -2.218954086303711, -2.0668296813964844, -1.9147051572799683, -1.7625806331634521, -1.610456109046936, -1.45833158493042, -1.3062070608139038, -1.1540825366973877, -1.0019580125808716, -0.8498339653015137, -0.6977094411849976, -0.5455849170684814, -0.39346039295196533, -0.24133586883544922, -0.0892113447189331, 0.06291317939758301, 0.21503770351409912, 0.36716222763061523, 0.5192867517471313, 0.6714112758636475, 0.8235357999801636, 0.9756603240966797, 1.1277848482131958, 1.279909372329712, 1.432033896446228, 1.5841584205627441, 1.7362829446792603, 1.8884074687957764, 2.040532112121582, 2.1926565170288086, 2.344780921936035, 2.496905565261841, 2.6490302085876465, 2.801154613494873, 2.9532790184020996, 3.1054036617279053, 3.257528305053711, 3.4096527099609375, 3.561777114868164, 3.7139017581939697, 3.8660264015197754, 4.018150806427002]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 22.0, 19.0, 27.0, 42.0, 71.0, 122.0, 173.0, 309.0, 662.0, 1754.0, 6957.0, 82158.0, 4066714.0, 28721.0, 4225.0, 1191.0, 485.0, 238.0, 130.0, 85.0, 52.0, 29.0, 17.0, 14.0, 8.0, 12.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46875, -5.3046875, -5.140625, -4.9765625, -4.8125, -4.6484375, -4.484375, -4.3203125, -4.15625, -3.9921875, -3.828125, -3.6640625, -3.5, -3.3359375, -3.171875, -3.0078125, -2.84375, -2.6796875, -2.515625, -2.3515625, -2.1875, -2.0234375, -1.859375, -1.6953125, -1.53125, -1.3671875, -1.203125, -1.0390625, -0.875, -0.7109375, -0.546875, -0.3828125, -0.21875, -0.0546875, 0.109375, 0.2734375, 0.4375, 0.6015625, 0.765625, 0.9296875, 1.09375, 1.2578125, 1.421875, 1.5859375, 1.75, 1.9140625, 2.078125, 2.2421875, 2.40625, 2.5703125, 2.734375, 2.8984375, 3.0625, 3.2265625, 3.390625, 3.5546875, 3.71875, 3.8828125, 4.046875, 4.2109375, 4.375, 4.5390625, 4.703125, 4.8671875, 5.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 15.0, 24.0, 37.0, 60.0, 81.0, 117.0, 118.0, 120.0, 96.0, 89.0, 65.0, 66.0, 28.0, 30.0, 10.0, 13.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7012786865234375, -0.678924560546875, -0.6565704345703125, -0.63421630859375, -0.6118621826171875, -0.589508056640625, -0.5671539306640625, -0.5447998046875, -0.5224456787109375, -0.500091552734375, -0.4777374267578125, -0.45538330078125, -0.4330291748046875, -0.410675048828125, -0.3883209228515625, -0.365966796875, -0.3436126708984375, -0.321258544921875, -0.2989044189453125, -0.27655029296875, -0.2541961669921875, -0.231842041015625, -0.2094879150390625, -0.1871337890625, -0.1647796630859375, -0.142425537109375, -0.1200714111328125, -0.09771728515625, -0.0753631591796875, -0.053009033203125, -0.0306549072265625, -0.00830078125, 0.0140533447265625, 0.036407470703125, 0.0587615966796875, 0.08111572265625, 0.1034698486328125, 0.125823974609375, 0.1481781005859375, 0.1705322265625, 0.1928863525390625, 0.215240478515625, 0.2375946044921875, 0.25994873046875, 0.2823028564453125, 0.304656982421875, 0.3270111083984375, 0.349365234375, 0.3717193603515625, 0.394073486328125, 0.4164276123046875, 0.43878173828125, 0.4611358642578125, 0.483489990234375, 0.5058441162109375, 0.5281982421875, 0.5505523681640625, 0.572906494140625, 0.5952606201171875, 0.61761474609375, 0.6399688720703125, 0.662322998046875, 0.6846771240234375, 0.70703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 13.0, 16.0, 12.0, 22.0, 35.0, 31.0, 47.0, 70.0, 105.0, 113.0, 198.0, 239.0, 377.0, 571.0, 820.0, 1418.0, 2434.0, 5533.0, 16340.0, 83085.0, 3706939.0, 324832.0, 33326.0, 8895.0, 3742.0, 1781.0, 1091.0, 661.0, 436.0, 305.0, 198.0, 156.0, 122.0, 83.0, 65.0, 42.0, 32.0, 27.0, 20.0, 15.0, 8.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8282318115234375, -1.768768310546875, -1.7093048095703125, -1.64984130859375, -1.5903778076171875, -1.530914306640625, -1.4714508056640625, -1.4119873046875, -1.3525238037109375, -1.293060302734375, -1.2335968017578125, -1.17413330078125, -1.1146697998046875, -1.055206298828125, -0.9957427978515625, -0.936279296875, -0.8768157958984375, -0.817352294921875, -0.7578887939453125, -0.69842529296875, -0.6389617919921875, -0.579498291015625, -0.5200347900390625, -0.4605712890625, -0.4011077880859375, -0.341644287109375, -0.2821807861328125, -0.22271728515625, -0.1632537841796875, -0.103790283203125, -0.0443267822265625, 0.01513671875, 0.0746002197265625, 0.134063720703125, 0.1935272216796875, 0.25299072265625, 0.3124542236328125, 0.371917724609375, 0.4313812255859375, 0.4908447265625, 0.5503082275390625, 0.609771728515625, 0.6692352294921875, 0.72869873046875, 0.7881622314453125, 0.847625732421875, 0.9070892333984375, 0.966552734375, 1.0260162353515625, 1.085479736328125, 1.1449432373046875, 1.20440673828125, 1.2638702392578125, 1.323333740234375, 1.3827972412109375, 1.4422607421875, 1.5017242431640625, 1.561187744140625, 1.6206512451171875, 1.68011474609375, 1.7395782470703125, 1.799041748046875, 1.8585052490234375, 1.91796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 59.0, 175.0, 2627.0, 889.0, 152.0, 53.0, 25.0, 15.0, 8.0, 2.0, 2.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.458984375, -1.4171600341796875, -1.375335693359375, -1.3335113525390625, -1.29168701171875, -1.2498626708984375, -1.208038330078125, -1.1662139892578125, -1.1243896484375, -1.0825653076171875, -1.040740966796875, -0.9989166259765625, -0.95709228515625, -0.9152679443359375, -0.873443603515625, -0.8316192626953125, -0.789794921875, -0.7479705810546875, -0.706146240234375, -0.6643218994140625, -0.62249755859375, -0.5806732177734375, -0.538848876953125, -0.4970245361328125, -0.4552001953125, -0.4133758544921875, -0.371551513671875, -0.3297271728515625, -0.28790283203125, -0.2460784912109375, -0.204254150390625, -0.1624298095703125, -0.12060546875, -0.0787811279296875, -0.036956787109375, 0.0048675537109375, 0.04669189453125, 0.0885162353515625, 0.130340576171875, 0.1721649169921875, 0.2139892578125, 0.2558135986328125, 0.297637939453125, 0.3394622802734375, 0.38128662109375, 0.4231109619140625, 0.464935302734375, 0.5067596435546875, 0.548583984375, 0.5904083251953125, 0.632232666015625, 0.6740570068359375, 0.71588134765625, 0.7577056884765625, 0.799530029296875, 0.8413543701171875, 0.8831787109375, 0.9250030517578125, 0.966827392578125, 1.0086517333984375, 1.05047607421875, 1.0923004150390625, 1.134124755859375, 1.1759490966796875, 1.2177734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 8.0, 25.0, 48.0, 128.0, 226.0, 237.0, 155.0, 91.0, 25.0, 22.0, 13.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4178354740142822, -3.2553305625915527, -3.092825412750244, -2.9303205013275146, -2.767815589904785, -2.6053104400634766, -2.442805528640747, -2.2803006172180176, -2.117795467376709, -1.95529043674469, -1.7927855253219604, -1.6302804946899414, -1.467775583267212, -1.3052705526351929, -1.1427655220031738, -0.9802606105804443, -0.8177556991577148, -0.6552507281303406, -0.4927457273006439, -0.33024072647094727, -0.167735755443573, -0.0052307844161987305, 0.1572742462158203, 0.3197791576385498, 0.48228418827056885, 0.6447891592979431, 0.8072941303253174, 0.9697991609573364, 1.1323041915893555, 1.294809103012085, 1.457314133644104, 1.6198190450668335, 1.7823243141174316, 1.9448293447494507, 2.1073343753814697, 2.269839286804199, 2.4323441982269287, 2.594849109649658, 2.757354259490967, 2.9198591709136963, 3.082364082336426, 3.2448689937591553, 3.407374143600464, 3.5698790550231934, 3.732383966445923, 3.8948888778686523, 4.057394027709961, 4.2198991775512695, 4.382404327392578, 4.544909477233887, 4.707414150238037, 4.869919300079346, 5.032424449920654, 5.194929122924805, 5.357434272766113, 5.519939422607422, 5.682444095611572, 5.844949245452881, 6.007453918457031, 6.16995906829834, 6.332464218139648, 6.494968891143799, 6.657474040985107, 6.819978713989258, 6.982483863830566]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 7.0, 34.0, 40.0, 43.0, 60.0, 63.0, 80.0, 75.0, 91.0, 77.0, 91.0, 90.0, 54.0, 43.0, 38.0, 27.0, 16.0, 12.0, 9.0, 10.0, 5.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9185948371887207, -3.8101539611816406, -3.7017130851745605, -3.5932722091674805, -3.4848310947418213, -3.376390218734741, -3.267949342727661, -3.159508466720581, -3.051067352294922, -2.942626476287842, -2.8341856002807617, -2.7257447242736816, -2.6173036098480225, -2.5088627338409424, -2.4004218578338623, -2.2919809818267822, -2.183540105819702, -2.075099229812622, -1.9666582345962524, -1.8582173585891724, -1.7497763633728027, -1.6413354873657227, -1.5328946113586426, -1.4244537353515625, -1.3160127401351929, -1.2075718641281128, -1.0991308689117432, -0.9906899929046631, -0.8822490572929382, -0.7738081216812134, -0.6653672456741333, -0.5569263100624084, -0.4484851360321045, -0.34004420042037964, -0.23160329461097717, -0.12316238880157471, -0.014721453189849854, 0.093719482421875, 0.20216035842895508, 0.31060129404067993, 0.4190422296524048, 0.5274831652641296, 0.6359241008758545, 0.7443649768829346, 0.8528059124946594, 0.9612468481063843, 1.0696877241134644, 1.178128719329834, 1.286569595336914, 1.3950104713439941, 1.5034514665603638, 1.6118923425674438, 1.7203333377838135, 1.8287742137908936, 1.9372150897979736, 2.0456559658050537, 2.154097080230713, 2.262537956237793, 2.370978832244873, 2.479419708251953, 2.5878608226776123, 2.6963016986846924, 2.8047425746917725, 2.9131834506988525, 3.0216243267059326]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 28.0, 48.0, 86.0, 173.0, 252.0, 495.0, 1006.0, 2052.0, 5512.0, 30889.0, 399416.0, 552925.0, 43886.0, 6976.0, 2405.0, 1074.0, 601.0, 287.0, 161.0, 89.0, 73.0, 36.0, 13.0, 9.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.103515625, -3.000335693359375, -2.89715576171875, -2.793975830078125, -2.6907958984375, -2.587615966796875, -2.48443603515625, -2.381256103515625, -2.278076171875, -2.174896240234375, -2.07171630859375, -1.968536376953125, -1.8653564453125, -1.762176513671875, -1.65899658203125, -1.555816650390625, -1.45263671875, -1.349456787109375, -1.24627685546875, -1.143096923828125, -1.0399169921875, -0.936737060546875, -0.83355712890625, -0.730377197265625, -0.627197265625, -0.524017333984375, -0.42083740234375, -0.317657470703125, -0.2144775390625, -0.111297607421875, -0.00811767578125, 0.095062255859375, 0.1982421875, 0.301422119140625, 0.40460205078125, 0.507781982421875, 0.6109619140625, 0.714141845703125, 0.81732177734375, 0.920501708984375, 1.023681640625, 1.126861572265625, 1.23004150390625, 1.333221435546875, 1.4364013671875, 1.539581298828125, 1.64276123046875, 1.745941162109375, 1.84912109375, 1.952301025390625, 2.05548095703125, 2.158660888671875, 2.2618408203125, 2.365020751953125, 2.46820068359375, 2.571380615234375, 2.674560546875, 2.777740478515625, 2.88092041015625, 2.984100341796875, 3.0872802734375, 3.190460205078125, 3.29364013671875, 3.396820068359375, 3.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 18.0, 53.0, 62.0, 94.0, 129.0, 111.0, 123.0, 84.0, 74.0, 73.0, 45.0, 46.0, 17.0, 15.0, 3.0, 9.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77978515625, -0.7555084228515625, -0.731231689453125, -0.7069549560546875, -0.68267822265625, -0.6584014892578125, -0.634124755859375, -0.6098480224609375, -0.5855712890625, -0.5612945556640625, -0.537017822265625, -0.5127410888671875, -0.48846435546875, -0.4641876220703125, -0.439910888671875, -0.4156341552734375, -0.391357421875, -0.3670806884765625, -0.342803955078125, -0.3185272216796875, -0.29425048828125, -0.2699737548828125, -0.245697021484375, -0.2214202880859375, -0.1971435546875, -0.1728668212890625, -0.148590087890625, -0.1243133544921875, -0.10003662109375, -0.0757598876953125, -0.051483154296875, -0.0272064208984375, -0.0029296875, 0.0213470458984375, 0.045623779296875, 0.0699005126953125, 0.09417724609375, 0.1184539794921875, 0.142730712890625, 0.1670074462890625, 0.1912841796875, 0.2155609130859375, 0.239837646484375, 0.2641143798828125, 0.28839111328125, 0.3126678466796875, 0.336944580078125, 0.3612213134765625, 0.385498046875, 0.4097747802734375, 0.434051513671875, 0.4583282470703125, 0.48260498046875, 0.5068817138671875, 0.531158447265625, 0.5554351806640625, 0.5797119140625, 0.6039886474609375, 0.628265380859375, 0.6525421142578125, 0.67681884765625, 0.7010955810546875, 0.725372314453125, 0.7496490478515625, 0.77392578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 18.0, 23.0, 37.0, 51.0, 72.0, 94.0, 164.0, 249.0, 436.0, 820.0, 1561.0, 3123.0, 7368.0, 18734.0, 56279.0, 181777.0, 408451.0, 248042.0, 78771.0, 25104.0, 9307.0, 3910.0, 1856.0, 913.0, 490.0, 327.0, 196.0, 117.0, 65.0, 60.0, 34.0, 25.0, 20.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.9598846435546875, -0.928558349609375, -0.8972320556640625, -0.86590576171875, -0.8345794677734375, -0.803253173828125, -0.7719268798828125, -0.7406005859375, -0.7092742919921875, -0.677947998046875, -0.6466217041015625, -0.61529541015625, -0.5839691162109375, -0.552642822265625, -0.5213165283203125, -0.489990234375, -0.4586639404296875, -0.427337646484375, -0.3960113525390625, -0.36468505859375, -0.3333587646484375, -0.302032470703125, -0.2707061767578125, -0.2393798828125, -0.2080535888671875, -0.176727294921875, -0.1454010009765625, -0.11407470703125, -0.0827484130859375, -0.051422119140625, -0.0200958251953125, 0.01123046875, 0.0425567626953125, 0.073883056640625, 0.1052093505859375, 0.13653564453125, 0.1678619384765625, 0.199188232421875, 0.2305145263671875, 0.2618408203125, 0.2931671142578125, 0.324493408203125, 0.3558197021484375, 0.38714599609375, 0.4184722900390625, 0.449798583984375, 0.4811248779296875, 0.512451171875, 0.5437774658203125, 0.575103759765625, 0.6064300537109375, 0.63775634765625, 0.6690826416015625, 0.700408935546875, 0.7317352294921875, 0.7630615234375, 0.7943878173828125, 0.825714111328125, 0.8570404052734375, 0.88836669921875, 0.9196929931640625, 0.951019287109375, 0.9823455810546875, 1.013671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 9.0, 9.0, 11.0, 9.0, 7.0, 17.0, 17.0, 17.0, 30.0, 36.0, 27.0, 28.0, 49.0, 54.0, 51.0, 63.0, 46.0, 63.0, 58.0, 47.0, 45.0, 49.0, 34.0, 35.0, 32.0, 33.0, 28.0, 16.0, 9.0, 15.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.42730712890625, -1.3800048828125, -1.33270263671875, -1.285400390625, -1.23809814453125, -1.1907958984375, -1.14349365234375, -1.09619140625, -1.04888916015625, -1.0015869140625, -0.95428466796875, -0.906982421875, -0.85968017578125, -0.8123779296875, -0.76507568359375, -0.7177734375, -0.67047119140625, -0.6231689453125, -0.57586669921875, -0.528564453125, -0.48126220703125, -0.4339599609375, -0.38665771484375, -0.33935546875, -0.29205322265625, -0.2447509765625, -0.19744873046875, -0.150146484375, -0.10284423828125, -0.0555419921875, -0.00823974609375, 0.0390625, 0.08636474609375, 0.1336669921875, 0.18096923828125, 0.228271484375, 0.27557373046875, 0.3228759765625, 0.37017822265625, 0.41748046875, 0.46478271484375, 0.5120849609375, 0.55938720703125, 0.606689453125, 0.65399169921875, 0.7012939453125, 0.74859619140625, 0.7958984375, 0.84320068359375, 0.8905029296875, 0.93780517578125, 0.985107421875, 1.03240966796875, 1.0797119140625, 1.12701416015625, 1.17431640625, 1.22161865234375, 1.2689208984375, 1.31622314453125, 1.363525390625, 1.41082763671875, 1.4581298828125, 1.50543212890625, 1.552734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 18.0, 34.0, 61.0, 146.0, 379.0, 1474.0, 11004.0, 594144.0, 430626.0, 8683.0, 1307.0, 406.0, 147.0, 54.0, 34.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -2.0, -1.951171875, -1.90234375, -1.853515625, -1.8046875, -1.755859375, -1.70703125, -1.658203125, -1.609375, -1.560546875, -1.51171875, -1.462890625, -1.4140625, -1.365234375, -1.31640625, -1.267578125, -1.21875, -1.169921875, -1.12109375, -1.072265625, -1.0234375, -0.974609375, -0.92578125, -0.876953125, -0.828125, -0.779296875, -0.73046875, -0.681640625, -0.6328125, -0.583984375, -0.53515625, -0.486328125, -0.4375, -0.388671875, -0.33984375, -0.291015625, -0.2421875, -0.193359375, -0.14453125, -0.095703125, -0.046875, 0.001953125, 0.05078125, 0.099609375, 0.1484375, 0.197265625, 0.24609375, 0.294921875, 0.34375, 0.392578125, 0.44140625, 0.490234375, 0.5390625, 0.587890625, 0.63671875, 0.685546875, 0.734375, 0.783203125, 0.83203125, 0.880859375, 0.9296875, 0.978515625, 1.02734375, 1.076171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 15.0, 14.0, 31.0, 46.0, 75.0, 120.0, 139.0, 162.0, 129.0, 97.0, 58.0, 41.0, 21.0, 13.0, 8.0, 5.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.00021147727966308594, -0.0002070888876914978, -0.00020270049571990967, -0.00019831210374832153, -0.0001939237117767334, -0.00018953531980514526, -0.00018514692783355713, -0.000180758535861969, -0.00017637014389038086, -0.00017198175191879272, -0.0001675933599472046, -0.00016320496797561646, -0.00015881657600402832, -0.00015442818403244019, -0.00015003979206085205, -0.00014565140008926392, -0.00014126300811767578, -0.00013687461614608765, -0.0001324862241744995, -0.00012809783220291138, -0.00012370944023132324, -0.00011932104825973511, -0.00011493265628814697, -0.00011054426431655884, -0.0001061558723449707, -0.00010176748037338257, -9.737908840179443e-05, -9.29906964302063e-05, -8.860230445861816e-05, -8.421391248703003e-05, -7.98255205154419e-05, -7.543712854385376e-05, -7.104873657226562e-05, -6.666034460067749e-05, -6.227195262908936e-05, -5.788356065750122e-05, -5.3495168685913086e-05, -4.910677671432495e-05, -4.4718384742736816e-05, -4.032999277114868e-05, -3.594160079956055e-05, -3.155320882797241e-05, -2.7164816856384277e-05, -2.2776424884796143e-05, -1.8388032913208008e-05, -1.3999640941619873e-05, -9.611248970031738e-06, -5.2228569984436035e-06, -8.344650268554688e-07, 3.553926944732666e-06, 7.9423189163208e-06, 1.2330710887908936e-05, 1.671910285949707e-05, 2.1107494831085205e-05, 2.549588680267334e-05, 2.9884278774261475e-05, 3.427267074584961e-05, 3.8661062717437744e-05, 4.304945468902588e-05, 4.7437846660614014e-05, 5.182623863220215e-05, 5.621463060379028e-05, 6.060302257537842e-05, 6.499141454696655e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 9.0, 18.0, 37.0, 37.0, 77.0, 159.0, 360.0, 1071.0, 3927.0, 21570.0, 225159.0, 702962.0, 79484.0, 10226.0, 2212.0, 684.0, 249.0, 114.0, 69.0, 36.0, 23.0, 21.0, 13.0, 10.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7437515258789062, -0.7165069580078125, -0.6892623901367188, -0.662017822265625, -0.6347732543945312, -0.6075286865234375, -0.5802841186523438, -0.55303955078125, -0.5257949829101562, -0.4985504150390625, -0.47130584716796875, -0.444061279296875, -0.41681671142578125, -0.3895721435546875, -0.36232757568359375, -0.3350830078125, -0.30783843994140625, -0.2805938720703125, -0.25334930419921875, -0.226104736328125, -0.19886016845703125, -0.1716156005859375, -0.14437103271484375, -0.11712646484375, -0.08988189697265625, -0.0626373291015625, -0.03539276123046875, -0.008148193359375, 0.01909637451171875, 0.0463409423828125, 0.07358551025390625, 0.100830078125, 0.12807464599609375, 0.1553192138671875, 0.18256378173828125, 0.209808349609375, 0.23705291748046875, 0.2642974853515625, 0.29154205322265625, 0.31878662109375, 0.34603118896484375, 0.3732757568359375, 0.40052032470703125, 0.427764892578125, 0.45500946044921875, 0.4822540283203125, 0.5094985961914062, 0.5367431640625, 0.5639877319335938, 0.5912322998046875, 0.6184768676757812, 0.645721435546875, 0.6729660034179688, 0.7002105712890625, 0.7274551391601562, 0.75469970703125, 0.7819442749023438, 0.8091888427734375, 0.8364334106445312, 0.863677978515625, 0.8909225463867188, 0.9181671142578125, 0.9454116821289062, 0.97265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 23.0, 21.0, 31.0, 56.0, 74.0, 112.0, 156.0, 132.0, 112.0, 90.0, 54.0, 46.0, 16.0, 18.0, 13.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2978515625, -1.268402099609375, -1.23895263671875, -1.209503173828125, -1.1800537109375, -1.150604248046875, -1.12115478515625, -1.091705322265625, -1.062255859375, -1.032806396484375, -1.00335693359375, -0.973907470703125, -0.9444580078125, -0.915008544921875, -0.88555908203125, -0.856109619140625, -0.82666015625, -0.797210693359375, -0.76776123046875, -0.738311767578125, -0.7088623046875, -0.679412841796875, -0.64996337890625, -0.620513916015625, -0.591064453125, -0.561614990234375, -0.53216552734375, -0.502716064453125, -0.4732666015625, -0.443817138671875, -0.41436767578125, -0.384918212890625, -0.35546875, -0.326019287109375, -0.29656982421875, -0.267120361328125, -0.2376708984375, -0.208221435546875, -0.17877197265625, -0.149322509765625, -0.119873046875, -0.090423583984375, -0.06097412109375, -0.031524658203125, -0.0020751953125, 0.027374267578125, 0.05682373046875, 0.086273193359375, 0.11572265625, 0.145172119140625, 0.17462158203125, 0.204071044921875, 0.2335205078125, 0.262969970703125, 0.29241943359375, 0.321868896484375, 0.351318359375, 0.380767822265625, 0.41021728515625, 0.439666748046875, 0.4691162109375, 0.498565673828125, 0.52801513671875, 0.557464599609375, 0.5869140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 31.0, 98.0, 293.0, 369.0, 149.0, 45.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.15915298461914, -47.269290924072266, -46.379432678222656, -45.48957061767578, -44.59971237182617, -43.7098503112793, -42.81999206542969, -41.93013000488281, -41.04026794433594, -40.15040588378906, -39.26054763793945, -38.37068557739258, -37.48082733154297, -36.590965270996094, -35.701107025146484, -34.81124496459961, -33.92138671875, -33.031524658203125, -32.141666412353516, -31.251806259155273, -30.36194610595703, -29.472084045410156, -28.582223892211914, -27.692363739013672, -26.80250358581543, -25.912643432617188, -25.022783279418945, -24.132923126220703, -23.243061065673828, -22.35320281982422, -21.463340759277344, -20.5734806060791, -19.683622360229492, -18.79376220703125, -17.903902053833008, -17.014041900634766, -16.12417984008789, -15.234320640563965, -14.344459533691406, -13.454599380493164, -12.564739227294922, -11.67487907409668, -10.785018920898438, -9.895157814025879, -9.005297660827637, -8.115437507629395, -7.225576877593994, -6.335716247558594, -5.445856094360352, -4.555995941162109, -3.666135311126709, -2.7762749195098877, -1.8864145278930664, -0.9965543746948242, -0.10669374465942383, 0.7831668853759766, 1.6730270385742188, 2.56288743019104, 3.4527478218078613, 4.342608451843262, 5.232468605041504, 6.122328758239746, 7.0121893882751465, 7.902050018310547, 8.791910171508789]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 9.0, 15.0, 12.0, 18.0, 19.0, 17.0, 17.0, 25.0, 26.0, 21.0, 31.0, 35.0, 44.0, 41.0, 37.0, 32.0, 42.0, 42.0, 40.0, 45.0, 44.0, 37.0, 35.0, 39.0, 36.0, 30.0, 26.0, 22.0, 20.0, 16.0, 16.0, 12.0, 18.0, 11.0, 7.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.000665187835693, -6.785818099975586, -6.5709710121154785, -6.356123924255371, -6.141276836395264, -5.926429748535156, -5.711583137512207, -5.4967360496521, -5.281888961791992, -5.067041873931885, -4.852194786071777, -4.63734769821167, -4.4225006103515625, -4.207653999328613, -3.9928066730499268, -3.7779598236083984, -3.563112497329712, -3.3482654094696045, -3.133418321609497, -2.9185714721679688, -2.7037243843078613, -2.488877296447754, -2.2740302085876465, -2.059183120727539, -1.8443361520767212, -1.6294890642166138, -1.414642095565796, -1.1997950077056885, -0.9849479794502258, -0.7701009511947632, -0.5552538633346558, -0.3404068946838379, -0.12555980682373047, 0.08928723633289337, 0.3041342794895172, 0.5189813375473022, 0.7338283658027649, 0.9486753940582275, 1.163522481918335, 1.3783694505691528, 1.5932165384292603, 1.8080636262893677, 2.0229105949401855, 2.237757682800293, 2.4526047706604004, 2.667451858520508, 2.8822989463806152, 3.0971457958221436, 3.311992883682251, 3.5268399715423584, 3.741687059402466, 3.956533908843994, 4.171380996704102, 4.386228084564209, 4.601075172424316, 4.815922260284424, 5.030769348144531, 5.245616436004639, 5.460463523864746, 5.6753106117248535, 5.890157699584961, 6.10500431060791, 6.319851875305176, 6.534698486328125, 6.749545574188232]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 6.0, 12.0, 20.0, 19.0, 35.0, 31.0, 54.0, 48.0, 65.0, 115.0, 144.0, 207.0, 365.0, 538.0, 956.0, 1705.0, 3611.0, 9285.0, 32687.0, 319047.0, 3720014.0, 76978.0, 16842.0, 5734.0, 2516.0, 1225.0, 695.0, 417.0, 276.0, 183.0, 112.0, 77.0, 61.0, 38.0, 34.0, 26.0, 13.0, 15.0, 12.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.76953125, -2.68621826171875, -2.6029052734375, -2.51959228515625, -2.436279296875, -2.35296630859375, -2.2696533203125, -2.18634033203125, -2.10302734375, -2.01971435546875, -1.9364013671875, -1.85308837890625, -1.769775390625, -1.68646240234375, -1.6031494140625, -1.51983642578125, -1.4365234375, -1.35321044921875, -1.2698974609375, -1.18658447265625, -1.103271484375, -1.01995849609375, -0.9366455078125, -0.85333251953125, -0.77001953125, -0.68670654296875, -0.6033935546875, -0.52008056640625, -0.436767578125, -0.35345458984375, -0.2701416015625, -0.18682861328125, -0.103515625, -0.02020263671875, 0.0631103515625, 0.14642333984375, 0.229736328125, 0.31304931640625, 0.3963623046875, 0.47967529296875, 0.56298828125, 0.64630126953125, 0.7296142578125, 0.81292724609375, 0.896240234375, 0.97955322265625, 1.0628662109375, 1.14617919921875, 1.2294921875, 1.31280517578125, 1.3961181640625, 1.47943115234375, 1.562744140625, 1.64605712890625, 1.7293701171875, 1.81268310546875, 1.89599609375, 1.97930908203125, 2.0626220703125, 2.14593505859375, 2.229248046875, 2.31256103515625, 2.3958740234375, 2.47918701171875, 2.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 9.0, 13.0, 20.0, 29.0, 52.0, 68.0, 79.0, 100.0, 100.0, 102.0, 94.0, 84.0, 69.0, 40.0, 47.0, 22.0, 24.0, 14.0, 11.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7890625, -0.7645950317382812, -0.7401275634765625, -0.7156600952148438, -0.691192626953125, -0.6667251586914062, -0.6422576904296875, -0.6177902221679688, -0.59332275390625, -0.5688552856445312, -0.5443878173828125, -0.5199203491210938, -0.495452880859375, -0.47098541259765625, -0.4465179443359375, -0.42205047607421875, -0.3975830078125, -0.37311553955078125, -0.3486480712890625, -0.32418060302734375, -0.299713134765625, -0.27524566650390625, -0.2507781982421875, -0.22631072998046875, -0.20184326171875, -0.17737579345703125, -0.1529083251953125, -0.12844085693359375, -0.103973388671875, -0.07950592041015625, -0.0550384521484375, -0.03057098388671875, -0.006103515625, 0.01836395263671875, 0.0428314208984375, 0.06729888916015625, 0.091766357421875, 0.11623382568359375, 0.1407012939453125, 0.16516876220703125, 0.18963623046875, 0.21410369873046875, 0.2385711669921875, 0.26303863525390625, 0.287506103515625, 0.31197357177734375, 0.3364410400390625, 0.36090850830078125, 0.3853759765625, 0.40984344482421875, 0.4343109130859375, 0.45877838134765625, 0.483245849609375, 0.5077133178710938, 0.5321807861328125, 0.5566482543945312, 0.58111572265625, 0.6055831909179688, 0.6300506591796875, 0.6545181274414062, 0.678985595703125, 0.7034530639648438, 0.7279205322265625, 0.7523880004882812, 0.77685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 11.0, 14.0, 33.0, 29.0, 41.0, 69.0, 95.0, 115.0, 203.0, 253.0, 423.0, 620.0, 1083.0, 2448.0, 7586.0, 37593.0, 1162235.0, 2922803.0, 44487.0, 8354.0, 2622.0, 1163.0, 702.0, 421.0, 277.0, 181.0, 140.0, 88.0, 56.0, 35.0, 20.0, 27.0, 20.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.86358642578125, -2.7818603515625, -2.70013427734375, -2.618408203125, -2.53668212890625, -2.4549560546875, -2.37322998046875, -2.29150390625, -2.20977783203125, -2.1280517578125, -2.04632568359375, -1.964599609375, -1.88287353515625, -1.8011474609375, -1.71942138671875, -1.6376953125, -1.55596923828125, -1.4742431640625, -1.39251708984375, -1.310791015625, -1.22906494140625, -1.1473388671875, -1.06561279296875, -0.98388671875, -0.90216064453125, -0.8204345703125, -0.73870849609375, -0.656982421875, -0.57525634765625, -0.4935302734375, -0.41180419921875, -0.330078125, -0.24835205078125, -0.1666259765625, -0.08489990234375, -0.003173828125, 0.07855224609375, 0.1602783203125, 0.24200439453125, 0.32373046875, 0.40545654296875, 0.4871826171875, 0.56890869140625, 0.650634765625, 0.73236083984375, 0.8140869140625, 0.89581298828125, 0.9775390625, 1.05926513671875, 1.1409912109375, 1.22271728515625, 1.304443359375, 1.38616943359375, 1.4678955078125, 1.54962158203125, 1.63134765625, 1.71307373046875, 1.7947998046875, 1.87652587890625, 1.958251953125, 2.03997802734375, 2.1217041015625, 2.20343017578125, 2.28515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 26.0, 59.0, 172.0, 1556.0, 1921.0, 188.0, 59.0, 31.0, 18.0, 9.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.5897674560546875, -1.526214599609375, -1.4626617431640625, -1.39910888671875, -1.3355560302734375, -1.272003173828125, -1.2084503173828125, -1.1448974609375, -1.0813446044921875, -1.017791748046875, -0.9542388916015625, -0.89068603515625, -0.8271331787109375, -0.763580322265625, -0.7000274658203125, -0.636474609375, -0.5729217529296875, -0.509368896484375, -0.4458160400390625, -0.38226318359375, -0.3187103271484375, -0.255157470703125, -0.1916046142578125, -0.1280517578125, -0.0644989013671875, -0.000946044921875, 0.0626068115234375, 0.12615966796875, 0.1897125244140625, 0.253265380859375, 0.3168182373046875, 0.38037109375, 0.4439239501953125, 0.507476806640625, 0.5710296630859375, 0.63458251953125, 0.6981353759765625, 0.761688232421875, 0.8252410888671875, 0.8887939453125, 0.9523468017578125, 1.015899658203125, 1.0794525146484375, 1.14300537109375, 1.2065582275390625, 1.270111083984375, 1.3336639404296875, 1.397216796875, 1.4607696533203125, 1.524322509765625, 1.5878753662109375, 1.65142822265625, 1.7149810791015625, 1.778533935546875, 1.8420867919921875, 1.9056396484375, 1.9691925048828125, 2.032745361328125, 2.0962982177734375, 2.15985107421875, 2.2234039306640625, 2.286956787109375, 2.3505096435546875, 2.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 9.0, 15.0, 27.0, 47.0, 90.0, 128.0, 176.0, 181.0, 117.0, 104.0, 38.0, 27.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.853998184204102, -6.669008731842041, -6.484019756317139, -6.299030303955078, -6.114041328430176, -5.929051876068115, -5.744062423706055, -5.559073448181152, -5.374083995819092, -5.189094543457031, -5.004105567932129, -4.819116115570068, -4.634126663208008, -4.4491376876831055, -4.264148235321045, -4.079158782958984, -3.894169807434082, -3.7091805934906006, -3.524191379547119, -3.3392019271850586, -3.154212713241577, -2.9692234992980957, -2.784234046936035, -2.5992448329925537, -2.4142556190490723, -2.229266405105591, -2.0442771911621094, -1.8592877388000488, -1.6742985248565674, -1.489309310913086, -1.304319977760315, -1.119330644607544, -0.9343414306640625, -0.7493521571159363, -0.5643628835678101, -0.37937361001968384, -0.19438433647155762, -0.009395062923431396, 0.17559421062469482, 0.3605835437774658, 0.5455727577209473, 0.7305620312690735, 0.9155513048171997, 1.1005406379699707, 1.2855298519134521, 1.4705190658569336, 1.6555083990097046, 1.8404977321624756, 2.025486946105957, 2.2104761600494385, 2.39546537399292, 2.5804548263549805, 2.765444040298462, 2.9504332542419434, 3.135422706604004, 3.3204119205474854, 3.505401134490967, 3.6903903484344482, 3.8753795623779297, 4.06036901473999, 4.245358467102051, 4.430347442626953, 4.615336894989014, 4.800326347351074, 4.985315322875977]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 9.0, 9.0, 12.0, 16.0, 33.0, 42.0, 51.0, 53.0, 66.0, 81.0, 76.0, 77.0, 96.0, 64.0, 73.0, 50.0, 53.0, 41.0, 24.0, 18.0, 21.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.932065963745117, -3.772571563720703, -3.613077163696289, -3.453583002090454, -3.29408860206604, -3.134594202041626, -2.975100040435791, -2.815605640411377, -2.656111240386963, -2.496616840362549, -2.3371224403381348, -2.1776282787323, -2.0181338787078857, -1.8586394786834717, -1.6991451978683472, -1.5396509170532227, -1.3801565170288086, -1.2206621170043945, -1.06116783618927, -0.9016734957695007, -0.7421791553497314, -0.5826848149299622, -0.42319047451019287, -0.26369619369506836, -0.1042017936706543, 0.05529254674911499, 0.21478688716888428, 0.37428122758865356, 0.5337755680084229, 0.6932699084281921, 0.8527642488479614, 1.012258529663086, 1.1717529296875, 1.331247329711914, 1.4907416105270386, 1.650235891342163, 1.8097302913665771, 1.9692246913909912, 2.128718852996826, 2.2882132530212402, 2.4477076530456543, 2.6072020530700684, 2.7666964530944824, 2.9261906147003174, 3.0856850147247314, 3.2451794147491455, 3.4046735763549805, 3.5641679763793945, 3.7236623764038086, 3.8831567764282227, 4.042651176452637, 4.202145576477051, 4.361639976501465, 4.521133899688721, 4.680628299713135, 4.840122699737549, 4.999617099761963, 5.159111499786377, 5.318605899810791, 5.478100299835205, 5.637594223022461, 5.797088623046875, 5.956583023071289, 6.116077423095703, 6.275571823120117]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 14.0, 16.0, 27.0, 26.0, 49.0, 78.0, 93.0, 127.0, 160.0, 237.0, 398.0, 621.0, 1058.0, 1722.0, 3652.0, 8466.0, 24708.0, 91722.0, 357865.0, 400129.0, 110030.0, 28707.0, 9585.0, 3978.0, 1957.0, 1104.0, 664.0, 367.0, 312.0, 203.0, 130.0, 101.0, 62.0, 34.0, 36.0, 28.0, 14.0, 18.0, 13.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.005859375, -1.94329833984375, -1.8807373046875, -1.81817626953125, -1.755615234375, -1.69305419921875, -1.6304931640625, -1.56793212890625, -1.50537109375, -1.44281005859375, -1.3802490234375, -1.31768798828125, -1.255126953125, -1.19256591796875, -1.1300048828125, -1.06744384765625, -1.0048828125, -0.94232177734375, -0.8797607421875, -0.81719970703125, -0.754638671875, -0.69207763671875, -0.6295166015625, -0.56695556640625, -0.50439453125, -0.44183349609375, -0.3792724609375, -0.31671142578125, -0.254150390625, -0.19158935546875, -0.1290283203125, -0.06646728515625, -0.00390625, 0.05865478515625, 0.1212158203125, 0.18377685546875, 0.246337890625, 0.30889892578125, 0.3714599609375, 0.43402099609375, 0.49658203125, 0.55914306640625, 0.6217041015625, 0.68426513671875, 0.746826171875, 0.80938720703125, 0.8719482421875, 0.93450927734375, 0.9970703125, 1.05963134765625, 1.1221923828125, 1.18475341796875, 1.247314453125, 1.30987548828125, 1.3724365234375, 1.43499755859375, 1.49755859375, 1.56011962890625, 1.6226806640625, 1.68524169921875, 1.747802734375, 1.81036376953125, 1.8729248046875, 1.93548583984375, 1.998046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 16.0, 27.0, 32.0, 50.0, 65.0, 89.0, 106.0, 98.0, 106.0, 94.0, 81.0, 69.0, 39.0, 32.0, 27.0, 19.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81103515625, -0.783966064453125, -0.75689697265625, -0.729827880859375, -0.7027587890625, -0.675689697265625, -0.64862060546875, -0.621551513671875, -0.594482421875, -0.567413330078125, -0.54034423828125, -0.513275146484375, -0.4862060546875, -0.459136962890625, -0.43206787109375, -0.404998779296875, -0.3779296875, -0.350860595703125, -0.32379150390625, -0.296722412109375, -0.2696533203125, -0.242584228515625, -0.21551513671875, -0.188446044921875, -0.161376953125, -0.134307861328125, -0.10723876953125, -0.080169677734375, -0.0531005859375, -0.026031494140625, 0.00103759765625, 0.028106689453125, 0.05517578125, 0.082244873046875, 0.10931396484375, 0.136383056640625, 0.1634521484375, 0.190521240234375, 0.21759033203125, 0.244659423828125, 0.271728515625, 0.298797607421875, 0.32586669921875, 0.352935791015625, 0.3800048828125, 0.407073974609375, 0.43414306640625, 0.461212158203125, 0.48828125, 0.515350341796875, 0.54241943359375, 0.569488525390625, 0.5965576171875, 0.623626708984375, 0.65069580078125, 0.677764892578125, 0.704833984375, 0.731903076171875, 0.75897216796875, 0.786041259765625, 0.8131103515625, 0.840179443359375, 0.86724853515625, 0.894317626953125, 0.92138671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 12.0, 26.0, 22.0, 33.0, 50.0, 105.0, 155.0, 259.0, 433.0, 820.0, 1670.0, 3509.0, 8394.0, 21835.0, 67962.0, 247397.0, 454936.0, 165859.0, 47052.0, 16078.0, 6304.0, 2744.0, 1260.0, 647.0, 350.0, 222.0, 113.0, 95.0, 53.0, 49.0, 30.0, 24.0, 16.0, 11.0, 6.0, 0.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4266204833984375, -1.379608154296875, -1.3325958251953125, -1.28558349609375, -1.2385711669921875, -1.191558837890625, -1.1445465087890625, -1.0975341796875, -1.0505218505859375, -1.003509521484375, -0.9564971923828125, -0.90948486328125, -0.8624725341796875, -0.815460205078125, -0.7684478759765625, -0.721435546875, -0.6744232177734375, -0.627410888671875, -0.5803985595703125, -0.53338623046875, -0.4863739013671875, -0.439361572265625, -0.3923492431640625, -0.3453369140625, -0.2983245849609375, -0.251312255859375, -0.2042999267578125, -0.15728759765625, -0.1102752685546875, -0.063262939453125, -0.0162506103515625, 0.03076171875, 0.0777740478515625, 0.124786376953125, 0.1717987060546875, 0.21881103515625, 0.2658233642578125, 0.312835693359375, 0.3598480224609375, 0.4068603515625, 0.4538726806640625, 0.500885009765625, 0.5478973388671875, 0.59490966796875, 0.6419219970703125, 0.688934326171875, 0.7359466552734375, 0.782958984375, 0.8299713134765625, 0.876983642578125, 0.9239959716796875, 0.97100830078125, 1.0180206298828125, 1.065032958984375, 1.1120452880859375, 1.1590576171875, 1.2060699462890625, 1.253082275390625, 1.3000946044921875, 1.34710693359375, 1.3941192626953125, 1.441131591796875, 1.4881439208984375, 1.53515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 12.0, 16.0, 27.0, 34.0, 35.0, 28.0, 56.0, 56.0, 74.0, 70.0, 60.0, 67.0, 69.0, 70.0, 59.0, 50.0, 37.0, 25.0, 26.0, 30.0, 21.0, 15.0, 9.0, 6.0, 8.0, 3.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.294921875, -3.21002197265625, -3.1251220703125, -3.04022216796875, -2.955322265625, -2.87042236328125, -2.7855224609375, -2.70062255859375, -2.61572265625, -2.53082275390625, -2.4459228515625, -2.36102294921875, -2.276123046875, -2.19122314453125, -2.1063232421875, -2.02142333984375, -1.9365234375, -1.85162353515625, -1.7667236328125, -1.68182373046875, -1.596923828125, -1.51202392578125, -1.4271240234375, -1.34222412109375, -1.25732421875, -1.17242431640625, -1.0875244140625, -1.00262451171875, -0.917724609375, -0.83282470703125, -0.7479248046875, -0.66302490234375, -0.578125, -0.49322509765625, -0.4083251953125, -0.32342529296875, -0.238525390625, -0.15362548828125, -0.0687255859375, 0.01617431640625, 0.10107421875, 0.18597412109375, 0.2708740234375, 0.35577392578125, 0.440673828125, 0.52557373046875, 0.6104736328125, 0.69537353515625, 0.7802734375, 0.86517333984375, 0.9500732421875, 1.03497314453125, 1.119873046875, 1.20477294921875, 1.2896728515625, 1.37457275390625, 1.45947265625, 1.54437255859375, 1.6292724609375, 1.71417236328125, 1.799072265625, 1.88397216796875, 1.9688720703125, 2.05377197265625, 2.138671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 15.0, 19.0, 41.0, 58.0, 92.0, 187.0, 365.0, 718.0, 1976.0, 6228.0, 28617.0, 258445.0, 654641.0, 78747.0, 12883.0, 3266.0, 1097.0, 551.0, 239.0, 154.0, 83.0, 43.0, 33.0, 18.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1300048828125, -1.094970703125, -1.0599365234375, -1.02490234375, -0.9898681640625, -0.954833984375, -0.9197998046875, -0.884765625, -0.8497314453125, -0.814697265625, -0.7796630859375, -0.74462890625, -0.7095947265625, -0.674560546875, -0.6395263671875, -0.6044921875, -0.5694580078125, -0.534423828125, -0.4993896484375, -0.46435546875, -0.4293212890625, -0.394287109375, -0.3592529296875, -0.32421875, -0.2891845703125, -0.254150390625, -0.2191162109375, -0.18408203125, -0.1490478515625, -0.114013671875, -0.0789794921875, -0.0439453125, -0.0089111328125, 0.026123046875, 0.0611572265625, 0.09619140625, 0.1312255859375, 0.166259765625, 0.2012939453125, 0.236328125, 0.2713623046875, 0.306396484375, 0.3414306640625, 0.37646484375, 0.4114990234375, 0.446533203125, 0.4815673828125, 0.5166015625, 0.5516357421875, 0.586669921875, 0.6217041015625, 0.65673828125, 0.6917724609375, 0.726806640625, 0.7618408203125, 0.796875, 0.8319091796875, 0.866943359375, 0.9019775390625, 0.93701171875, 0.9720458984375, 1.007080078125, 1.0421142578125, 1.0771484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 27.0, 37.0, 65.0, 93.0, 143.0, 159.0, 175.0, 110.0, 62.0, 32.0, 27.0, 18.0, 17.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.605979382991791e-05, -7.925555109977722e-05, -7.245130836963654e-05, -6.564706563949585e-05, -5.8842822909355164e-05, -5.203858017921448e-05, -4.523433744907379e-05, -3.8430094718933105e-05, -3.162585198879242e-05, -2.4821609258651733e-05, -1.8017366528511047e-05, -1.1213123798370361e-05, -4.408881068229675e-06, 2.3953616619110107e-06, 9.199604392051697e-06, 1.6003847122192383e-05, 2.280808985233307e-05, 2.9612332582473755e-05, 3.641657531261444e-05, 4.322081804275513e-05, 5.002506077289581e-05, 5.68293035030365e-05, 6.363354623317719e-05, 7.043778896331787e-05, 7.724203169345856e-05, 8.404627442359924e-05, 9.085051715373993e-05, 9.765475988388062e-05, 0.0001044590026140213, 0.00011126324534416199, 0.00011806748807430267, 0.00012487173080444336, 0.00013167597353458405, 0.00013848021626472473, 0.00014528445899486542, 0.0001520887017250061, 0.0001588929444551468, 0.00016569718718528748, 0.00017250142991542816, 0.00017930567264556885, 0.00018610991537570953, 0.00019291415810585022, 0.0001997184008359909, 0.0002065226435661316, 0.00021332688629627228, 0.00022013112902641296, 0.00022693537175655365, 0.00023373961448669434, 0.00024054385721683502, 0.0002473480999469757, 0.0002541523426771164, 0.0002609565854072571, 0.00026776082813739777, 0.00027456507086753845, 0.00028136931359767914, 0.0002881735563278198, 0.0002949777990579605, 0.0003017820417881012, 0.0003085862845182419, 0.00031539052724838257, 0.00032219476997852325, 0.00032899901270866394, 0.0003358032554388046, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 17.0, 17.0, 42.0, 48.0, 86.0, 96.0, 223.0, 318.0, 632.0, 1130.0, 2466.0, 6266.0, 19539.0, 81246.0, 387271.0, 423959.0, 91758.0, 21123.0, 6722.0, 2758.0, 1289.0, 612.0, 379.0, 198.0, 136.0, 64.0, 59.0, 30.0, 23.0, 12.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.5995330810546875, -0.576507568359375, -0.5534820556640625, -0.53045654296875, -0.5074310302734375, -0.484405517578125, -0.4613800048828125, -0.4383544921875, -0.4153289794921875, -0.392303466796875, -0.3692779541015625, -0.34625244140625, -0.3232269287109375, -0.300201416015625, -0.2771759033203125, -0.254150390625, -0.2311248779296875, -0.208099365234375, -0.1850738525390625, -0.16204833984375, -0.1390228271484375, -0.115997314453125, -0.0929718017578125, -0.0699462890625, -0.0469207763671875, -0.023895263671875, -0.0008697509765625, 0.02215576171875, 0.0451812744140625, 0.068206787109375, 0.0912322998046875, 0.1142578125, 0.1372833251953125, 0.160308837890625, 0.1833343505859375, 0.20635986328125, 0.2293853759765625, 0.252410888671875, 0.2754364013671875, 0.2984619140625, 0.3214874267578125, 0.344512939453125, 0.3675384521484375, 0.39056396484375, 0.4135894775390625, 0.436614990234375, 0.4596405029296875, 0.482666015625, 0.5056915283203125, 0.528717041015625, 0.5517425537109375, 0.57476806640625, 0.5977935791015625, 0.620819091796875, 0.6438446044921875, 0.6668701171875, 0.6898956298828125, 0.712921142578125, 0.7359466552734375, 0.75897216796875, 0.7819976806640625, 0.805023193359375, 0.8280487060546875, 0.85107421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 11.0, 11.0, 17.0, 16.0, 30.0, 44.0, 57.0, 77.0, 105.0, 131.0, 122.0, 107.0, 80.0, 42.0, 32.0, 43.0, 22.0, 8.0, 10.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.090087890625, -1.05224609375, -1.014404296875, -0.9765625, -0.938720703125, -0.90087890625, -0.863037109375, -0.8251953125, -0.787353515625, -0.74951171875, -0.711669921875, -0.673828125, -0.635986328125, -0.59814453125, -0.560302734375, -0.5224609375, -0.484619140625, -0.44677734375, -0.408935546875, -0.37109375, -0.333251953125, -0.29541015625, -0.257568359375, -0.2197265625, -0.181884765625, -0.14404296875, -0.106201171875, -0.068359375, -0.030517578125, 0.00732421875, 0.045166015625, 0.0830078125, 0.120849609375, 0.15869140625, 0.196533203125, 0.234375, 0.272216796875, 0.31005859375, 0.347900390625, 0.3857421875, 0.423583984375, 0.46142578125, 0.499267578125, 0.537109375, 0.574951171875, 0.61279296875, 0.650634765625, 0.6884765625, 0.726318359375, 0.76416015625, 0.802001953125, 0.83984375, 0.877685546875, 0.91552734375, 0.953369140625, 0.9912109375, 1.029052734375, 1.06689453125, 1.104736328125, 1.142578125, 1.180419921875, 1.21826171875, 1.256103515625, 1.2939453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 17.0, 21.0, 55.0, 72.0, 110.0, 151.0, 157.0, 162.0, 97.0, 59.0, 42.0, 16.0, 17.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.332056999206543, -7.817634582519531, -7.3032121658325195, -6.788789749145508, -6.274367332458496, -5.759944915771484, -5.245522499084473, -4.731100082397461, -4.216677665710449, -3.7022552490234375, -3.187832832336426, -2.673410415649414, -2.1589879989624023, -1.6445655822753906, -1.130143165588379, -0.6157207489013672, -0.10129833221435547, 0.41312408447265625, 0.927546501159668, 1.4419689178466797, 1.9563913345336914, 2.470813751220703, 2.985236167907715, 3.4996585845947266, 4.014081001281738, 4.52850341796875, 5.042925834655762, 5.557348251342773, 6.071770668029785, 6.586193084716797, 7.100615501403809, 7.61503791809082, 8.129459381103516, 8.643881797790527, 9.158304214477539, 9.67272663116455, 10.187149047851562, 10.701571464538574, 11.215993881225586, 11.730416297912598, 12.24483871459961, 12.759261131286621, 13.273683547973633, 13.788105964660645, 14.302528381347656, 14.816950798034668, 15.33137321472168, 15.845795631408691, 16.360218048095703, 16.87464141845703, 17.389062881469727, 17.903484344482422, 18.41790771484375, 18.932331085205078, 19.446752548217773, 19.96117401123047, 20.475597381591797, 20.990020751953125, 21.50444221496582, 22.018863677978516, 22.533287048339844, 23.047710418701172, 23.562131881713867, 24.076553344726562, 24.59097671508789]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 7.0, 10.0, 17.0, 17.0, 24.0, 31.0, 33.0, 43.0, 38.0, 51.0, 39.0, 52.0, 42.0, 39.0, 66.0, 64.0, 55.0, 52.0, 52.0, 35.0, 42.0, 30.0, 23.0, 25.0, 22.0, 14.0, 21.0, 13.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.562973022460938, -11.183988571166992, -10.805004119873047, -10.426019668579102, -10.047036170959473, -9.668051719665527, -9.289067268371582, -8.910082817077637, -8.531098365783691, -8.152113914489746, -7.773129940032959, -7.394145488739014, -7.015161037445068, -6.636177062988281, -6.257192611694336, -5.878208160400391, -5.4992241859436035, -5.120239734649658, -4.741255760192871, -4.362271308898926, -3.9832868576049805, -3.6043026447296143, -3.225318431854248, -2.8463339805603027, -2.4673497676849365, -2.0883655548095703, -1.709381103515625, -1.3303968906402588, -0.951412558555603, -0.5724282264709473, -0.19344401359558105, 0.18554043769836426, 0.5645246505737305, 0.9435089826583862, 1.322493314743042, 1.7014775276184082, 2.0804619789123535, 2.4594461917877197, 2.838430404663086, 3.2174148559570312, 3.5963990688323975, 3.9753832817077637, 4.354367733001709, 4.733351707458496, 5.112336158752441, 5.491320610046387, 5.870305061340332, 6.249289512634277, 6.6282734870910645, 7.00725793838501, 7.386241912841797, 7.765226364135742, 8.144210815429688, 8.523195266723633, 8.902179718017578, 9.281164169311523, 9.660147666931152, 10.039132118225098, 10.418116569519043, 10.797100067138672, 11.176084518432617, 11.555068969726562, 11.934053421020508, 12.313037872314453, 12.692022323608398]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 8.0, 24.0, 29.0, 56.0, 74.0, 150.0, 296.0, 618.0, 1636.0, 6240.0, 51202.0, 4096515.0, 30251.0, 4669.0, 1367.0, 532.0, 236.0, 134.0, 69.0, 41.0, 23.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.5234375, -4.37939453125, -4.2353515625, -4.09130859375, -3.947265625, -3.80322265625, -3.6591796875, -3.51513671875, -3.37109375, -3.22705078125, -3.0830078125, -2.93896484375, -2.794921875, -2.65087890625, -2.5068359375, -2.36279296875, -2.21875, -2.07470703125, -1.9306640625, -1.78662109375, -1.642578125, -1.49853515625, -1.3544921875, -1.21044921875, -1.06640625, -0.92236328125, -0.7783203125, -0.63427734375, -0.490234375, -0.34619140625, -0.2021484375, -0.05810546875, 0.0859375, 0.22998046875, 0.3740234375, 0.51806640625, 0.662109375, 0.80615234375, 0.9501953125, 1.09423828125, 1.23828125, 1.38232421875, 1.5263671875, 1.67041015625, 1.814453125, 1.95849609375, 2.1025390625, 2.24658203125, 2.390625, 2.53466796875, 2.6787109375, 2.82275390625, 2.966796875, 3.11083984375, 3.2548828125, 3.39892578125, 3.54296875, 3.68701171875, 3.8310546875, 3.97509765625, 4.119140625, 4.26318359375, 4.4072265625, 4.55126953125, 4.6953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 20.0, 20.0, 18.0, 48.0, 60.0, 48.0, 84.0, 84.0, 100.0, 95.0, 91.0, 70.0, 68.0, 35.0, 51.0, 31.0, 17.0, 11.0, 12.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8783721923828125, -0.849029541015625, -0.8196868896484375, -0.79034423828125, -0.7610015869140625, -0.731658935546875, -0.7023162841796875, -0.6729736328125, -0.6436309814453125, -0.614288330078125, -0.5849456787109375, -0.55560302734375, -0.5262603759765625, -0.496917724609375, -0.4675750732421875, -0.438232421875, -0.4088897705078125, -0.379547119140625, -0.3502044677734375, -0.32086181640625, -0.2915191650390625, -0.262176513671875, -0.2328338623046875, -0.2034912109375, -0.1741485595703125, -0.144805908203125, -0.1154632568359375, -0.08612060546875, -0.0567779541015625, -0.027435302734375, 0.0019073486328125, 0.03125, 0.0605926513671875, 0.089935302734375, 0.1192779541015625, 0.14862060546875, 0.1779632568359375, 0.207305908203125, 0.2366485595703125, 0.2659912109375, 0.2953338623046875, 0.324676513671875, 0.3540191650390625, 0.38336181640625, 0.4127044677734375, 0.442047119140625, 0.4713897705078125, 0.500732421875, 0.5300750732421875, 0.559417724609375, 0.5887603759765625, 0.61810302734375, 0.6474456787109375, 0.676788330078125, 0.7061309814453125, 0.7354736328125, 0.7648162841796875, 0.794158935546875, 0.8235015869140625, 0.85284423828125, 0.8821868896484375, 0.911529541015625, 0.9408721923828125, 0.97021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 17.0, 12.0, 22.0, 25.0, 25.0, 38.0, 54.0, 78.0, 76.0, 108.0, 146.0, 256.0, 379.0, 762.0, 1671.0, 4634.0, 22595.0, 3870615.0, 271619.0, 14341.0, 3618.0, 1305.0, 626.0, 353.0, 248.0, 168.0, 122.0, 86.0, 53.0, 48.0, 30.0, 27.0, 29.0, 17.0, 12.0, 7.0, 10.0, 13.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.953125, -3.82513427734375, -3.6971435546875, -3.56915283203125, -3.441162109375, -3.31317138671875, -3.1851806640625, -3.05718994140625, -2.92919921875, -2.80120849609375, -2.6732177734375, -2.54522705078125, -2.417236328125, -2.28924560546875, -2.1612548828125, -2.03326416015625, -1.9052734375, -1.77728271484375, -1.6492919921875, -1.52130126953125, -1.393310546875, -1.26531982421875, -1.1373291015625, -1.00933837890625, -0.88134765625, -0.75335693359375, -0.6253662109375, -0.49737548828125, -0.369384765625, -0.24139404296875, -0.1134033203125, 0.01458740234375, 0.142578125, 0.27056884765625, 0.3985595703125, 0.52655029296875, 0.654541015625, 0.78253173828125, 0.9105224609375, 1.03851318359375, 1.16650390625, 1.29449462890625, 1.4224853515625, 1.55047607421875, 1.678466796875, 1.80645751953125, 1.9344482421875, 2.06243896484375, 2.1904296875, 2.31842041015625, 2.4464111328125, 2.57440185546875, 2.702392578125, 2.83038330078125, 2.9583740234375, 3.08636474609375, 3.21435546875, 3.34234619140625, 3.4703369140625, 3.59832763671875, 3.726318359375, 3.85430908203125, 3.9822998046875, 4.11029052734375, 4.23828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 6.0, 13.0, 26.0, 106.0, 3401.0, 426.0, 55.0, 19.0, 10.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9326171875, -0.891876220703125, -0.85113525390625, -0.810394287109375, -0.7696533203125, -0.728912353515625, -0.68817138671875, -0.647430419921875, -0.606689453125, -0.565948486328125, -0.52520751953125, -0.484466552734375, -0.4437255859375, -0.402984619140625, -0.36224365234375, -0.321502685546875, -0.28076171875, -0.240020751953125, -0.19927978515625, -0.158538818359375, -0.1177978515625, -0.077056884765625, -0.03631591796875, 0.004425048828125, 0.045166015625, 0.085906982421875, 0.12664794921875, 0.167388916015625, 0.2081298828125, 0.248870849609375, 0.28961181640625, 0.330352783203125, 0.37109375, 0.411834716796875, 0.45257568359375, 0.493316650390625, 0.5340576171875, 0.574798583984375, 0.61553955078125, 0.656280517578125, 0.697021484375, 0.737762451171875, 0.77850341796875, 0.819244384765625, 0.8599853515625, 0.900726318359375, 0.94146728515625, 0.982208251953125, 1.02294921875, 1.063690185546875, 1.10443115234375, 1.145172119140625, 1.1859130859375, 1.226654052734375, 1.26739501953125, 1.308135986328125, 1.348876953125, 1.389617919921875, 1.43035888671875, 1.471099853515625, 1.5118408203125, 1.552581787109375, 1.59332275390625, 1.634063720703125, 1.6748046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 42.0, 72.0, 217.0, 314.0, 182.0, 94.0, 44.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0910727977752686, -2.906198263168335, -2.7213237285614014, -2.5364491939544678, -2.351574659347534, -2.1667001247406006, -1.9818254709243774, -1.7969509363174438, -1.6120764017105103, -1.4272018671035767, -1.242327332496643, -1.05745267868042, -0.8725782036781311, -0.6877036690711975, -0.5028290748596191, -0.31795454025268555, -0.13308000564575195, 0.051794543862342834, 0.23666909337043762, 0.4215436577796936, 0.6064181923866272, 0.7912927269935608, 0.9761673212051392, 1.1610418558120728, 1.3459163904190063, 1.53079092502594, 1.7156654596328735, 1.9005401134490967, 2.0854146480560303, 2.270289182662964, 2.4551637172698975, 2.640038251876831, 2.8249125480651855, 3.009787082672119, 3.1946616172790527, 3.3795361518859863, 3.56441068649292, 3.7492852210998535, 3.934159755706787, 4.119034290313721, 4.303908824920654, 4.488783359527588, 4.6736578941345215, 4.858532428741455, 5.043406963348389, 5.228281497955322, 5.413156032562256, 5.5980305671691895, 5.782905578613281, 5.967780113220215, 6.152654647827148, 6.337529182434082, 6.522403717041016, 6.707278251647949, 6.892152786254883, 7.077027320861816, 7.26190185546875, 7.446776390075684, 7.631650924682617, 7.816525459289551, 8.001399993896484, 8.186274528503418, 8.371149063110352, 8.556023597717285, 8.740898132324219]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 5.0, 5.0, 21.0, 16.0, 17.0, 20.0, 27.0, 29.0, 28.0, 35.0, 31.0, 49.0, 44.0, 43.0, 56.0, 55.0, 55.0, 50.0, 43.0, 49.0, 46.0, 38.0, 36.0, 40.0, 25.0, 24.0, 16.0, 21.0, 22.0, 8.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1871438026428223, -2.120305061340332, -2.053466558456421, -1.9866278171539307, -1.91978919506073, -1.8529505729675293, -1.7861119508743286, -1.719273328781128, -1.6524345874786377, -1.585595965385437, -1.5187573432922363, -1.451918601989746, -1.3850799798965454, -1.3182413578033447, -1.251402735710144, -1.1845641136169434, -1.1177254915237427, -1.050886869430542, -0.9840481877326965, -0.9172095656394958, -0.8503708839416504, -0.7835322618484497, -0.716693639755249, -0.6498550176620483, -0.5830163359642029, -0.5161777138710022, -0.44933903217315674, -0.38250041007995605, -0.315661758184433, -0.2488231062889099, -0.18198448419570923, -0.11514583230018616, -0.048307180404663086, 0.01853146404027939, 0.08537010848522186, 0.15220874547958374, 0.2190473973751068, 0.2858860492706299, 0.35272467136383057, 0.41956332325935364, 0.4864019751548767, 0.5532405972480774, 0.6200792789459229, 0.6869179010391235, 0.7537565231323242, 0.8205952048301697, 0.8874338269233704, 0.9542725086212158, 1.0211111307144165, 1.0879497528076172, 1.1547883749008179, 1.2216269969940186, 1.2884657382965088, 1.3553043603897095, 1.4221429824829102, 1.4889816045761108, 1.5558202266693115, 1.6226588487625122, 1.689497470855713, 1.7563362121582031, 1.8231748342514038, 1.8900134563446045, 1.9568520784378052, 2.023690700531006, 2.090529441833496]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 30.0, 20.0, 48.0, 107.0, 164.0, 270.0, 511.0, 1015.0, 2281.0, 5734.0, 17249.0, 60332.0, 224394.0, 452267.0, 204294.0, 54223.0, 15931.0, 5364.0, 2218.0, 993.0, 439.0, 281.0, 149.0, 72.0, 64.0, 40.0, 20.0, 10.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.205078125, -2.1326904296875, -2.060302734375, -1.9879150390625, -1.91552734375, -1.8431396484375, -1.770751953125, -1.6983642578125, -1.6259765625, -1.5535888671875, -1.481201171875, -1.4088134765625, -1.33642578125, -1.2640380859375, -1.191650390625, -1.1192626953125, -1.046875, -0.9744873046875, -0.902099609375, -0.8297119140625, -0.75732421875, -0.6849365234375, -0.612548828125, -0.5401611328125, -0.4677734375, -0.3953857421875, -0.322998046875, -0.2506103515625, -0.17822265625, -0.1058349609375, -0.033447265625, 0.0389404296875, 0.111328125, 0.1837158203125, 0.256103515625, 0.3284912109375, 0.40087890625, 0.4732666015625, 0.545654296875, 0.6180419921875, 0.6904296875, 0.7628173828125, 0.835205078125, 0.9075927734375, 0.97998046875, 1.0523681640625, 1.124755859375, 1.1971435546875, 1.26953125, 1.3419189453125, 1.414306640625, 1.4866943359375, 1.55908203125, 1.6314697265625, 1.703857421875, 1.7762451171875, 1.8486328125, 1.9210205078125, 1.993408203125, 2.0657958984375, 2.13818359375, 2.2105712890625, 2.282958984375, 2.3553466796875, 2.427734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 14.0, 15.0, 11.0, 28.0, 27.0, 46.0, 34.0, 47.0, 53.0, 68.0, 66.0, 68.0, 72.0, 76.0, 59.0, 44.0, 52.0, 49.0, 38.0, 24.0, 24.0, 24.0, 17.0, 10.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.909515380859375, -0.88006591796875, -0.850616455078125, -0.8211669921875, -0.791717529296875, -0.76226806640625, -0.732818603515625, -0.703369140625, -0.673919677734375, -0.64447021484375, -0.615020751953125, -0.5855712890625, -0.556121826171875, -0.52667236328125, -0.497222900390625, -0.4677734375, -0.438323974609375, -0.40887451171875, -0.379425048828125, -0.3499755859375, -0.320526123046875, -0.29107666015625, -0.261627197265625, -0.232177734375, -0.202728271484375, -0.17327880859375, -0.143829345703125, -0.1143798828125, -0.084930419921875, -0.05548095703125, -0.026031494140625, 0.00341796875, 0.032867431640625, 0.06231689453125, 0.091766357421875, 0.1212158203125, 0.150665283203125, 0.18011474609375, 0.209564208984375, 0.239013671875, 0.268463134765625, 0.29791259765625, 0.327362060546875, 0.3568115234375, 0.386260986328125, 0.41571044921875, 0.445159912109375, 0.474609375, 0.504058837890625, 0.53350830078125, 0.562957763671875, 0.5924072265625, 0.621856689453125, 0.65130615234375, 0.680755615234375, 0.710205078125, 0.739654541015625, 0.76910400390625, 0.798553466796875, 0.8280029296875, 0.857452392578125, 0.88690185546875, 0.916351318359375, 0.94580078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 39.0, 52.0, 57.0, 103.0, 143.0, 265.0, 527.0, 1016.0, 2444.0, 6116.0, 17876.0, 70046.0, 373663.0, 457119.0, 85728.0, 21067.0, 6977.0, 2739.0, 1221.0, 537.0, 269.0, 148.0, 116.0, 65.0, 46.0, 28.0, 27.0, 25.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80047607421875, -2.7103271484375, -2.62017822265625, -2.530029296875, -2.43988037109375, -2.3497314453125, -2.25958251953125, -2.16943359375, -2.07928466796875, -1.9891357421875, -1.89898681640625, -1.808837890625, -1.71868896484375, -1.6285400390625, -1.53839111328125, -1.4482421875, -1.35809326171875, -1.2679443359375, -1.17779541015625, -1.087646484375, -0.99749755859375, -0.9073486328125, -0.81719970703125, -0.72705078125, -0.63690185546875, -0.5467529296875, -0.45660400390625, -0.366455078125, -0.27630615234375, -0.1861572265625, -0.09600830078125, -0.005859375, 0.08428955078125, 0.1744384765625, 0.26458740234375, 0.354736328125, 0.44488525390625, 0.5350341796875, 0.62518310546875, 0.71533203125, 0.80548095703125, 0.8956298828125, 0.98577880859375, 1.075927734375, 1.16607666015625, 1.2562255859375, 1.34637451171875, 1.4365234375, 1.52667236328125, 1.6168212890625, 1.70697021484375, 1.797119140625, 1.88726806640625, 1.9774169921875, 2.06756591796875, 2.15771484375, 2.24786376953125, 2.3380126953125, 2.42816162109375, 2.518310546875, 2.60845947265625, 2.6986083984375, 2.78875732421875, 2.87890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 5.0, 5.0, 13.0, 12.0, 13.0, 17.0, 18.0, 23.0, 27.0, 36.0, 29.0, 49.0, 33.0, 51.0, 54.0, 51.0, 48.0, 54.0, 51.0, 40.0, 53.0, 50.0, 33.0, 41.0, 36.0, 28.0, 23.0, 14.0, 13.0, 13.0, 11.0, 4.0, 5.0, 6.0, 8.0, 4.0, 1.0, 6.0, 3.0, 0.0, 3.0, 5.0], "bins": [-4.78515625, -4.6619873046875, -4.538818359375, -4.4156494140625, -4.29248046875, -4.1693115234375, -4.046142578125, -3.9229736328125, -3.7998046875, -3.6766357421875, -3.553466796875, -3.4302978515625, -3.30712890625, -3.1839599609375, -3.060791015625, -2.9376220703125, -2.814453125, -2.6912841796875, -2.568115234375, -2.4449462890625, -2.32177734375, -2.1986083984375, -2.075439453125, -1.9522705078125, -1.8291015625, -1.7059326171875, -1.582763671875, -1.4595947265625, -1.33642578125, -1.2132568359375, -1.090087890625, -0.9669189453125, -0.84375, -0.7205810546875, -0.597412109375, -0.4742431640625, -0.35107421875, -0.2279052734375, -0.104736328125, 0.0184326171875, 0.1416015625, 0.2647705078125, 0.387939453125, 0.5111083984375, 0.63427734375, 0.7574462890625, 0.880615234375, 1.0037841796875, 1.126953125, 1.2501220703125, 1.373291015625, 1.4964599609375, 1.61962890625, 1.7427978515625, 1.865966796875, 1.9891357421875, 2.1123046875, 2.2354736328125, 2.358642578125, 2.4818115234375, 2.60498046875, 2.7281494140625, 2.851318359375, 2.9744873046875, 3.09765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 12.0, 16.0, 19.0, 64.0, 124.0, 308.0, 1087.0, 7519.0, 1012012.0, 24793.0, 1871.0, 424.0, 161.0, 62.0, 31.0, 17.0, 15.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.6126708984375, -7.405029296875, -7.1973876953125, -6.98974609375, -6.7821044921875, -6.574462890625, -6.3668212890625, -6.1591796875, -5.9515380859375, -5.743896484375, -5.5362548828125, -5.32861328125, -5.1209716796875, -4.913330078125, -4.7056884765625, -4.498046875, -4.2904052734375, -4.082763671875, -3.8751220703125, -3.66748046875, -3.4598388671875, -3.252197265625, -3.0445556640625, -2.8369140625, -2.6292724609375, -2.421630859375, -2.2139892578125, -2.00634765625, -1.7987060546875, -1.591064453125, -1.3834228515625, -1.17578125, -0.9681396484375, -0.760498046875, -0.5528564453125, -0.34521484375, -0.1375732421875, 0.070068359375, 0.2777099609375, 0.4853515625, 0.6929931640625, 0.900634765625, 1.1082763671875, 1.31591796875, 1.5235595703125, 1.731201171875, 1.9388427734375, 2.146484375, 2.3541259765625, 2.561767578125, 2.7694091796875, 2.97705078125, 3.1846923828125, 3.392333984375, 3.5999755859375, 3.8076171875, 4.0152587890625, 4.222900390625, 4.4305419921875, 4.63818359375, 4.8458251953125, 5.053466796875, 5.2611083984375, 5.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 9.0, 4.0, 20.0, 27.0, 48.0, 88.0, 99.0, 151.0, 164.0, 136.0, 109.0, 53.0, 35.0, 16.0, 18.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028228759765625, -0.0002748984843492508, -0.0002675093710422516, -0.0002601202577352524, -0.0002527311444282532, -0.00024534203112125397, -0.00023795291781425476, -0.00023056380450725555, -0.00022317469120025635, -0.00021578557789325714, -0.00020839646458625793, -0.00020100735127925873, -0.00019361823797225952, -0.00018622912466526031, -0.0001788400113582611, -0.0001714508980512619, -0.0001640617847442627, -0.0001566726714372635, -0.00014928355813026428, -0.00014189444482326508, -0.00013450533151626587, -0.00012711621820926666, -0.00011972710490226746, -0.00011233799159526825, -0.00010494887828826904, -9.755976498126984e-05, -9.017065167427063e-05, -8.278153836727142e-05, -7.539242506027222e-05, -6.800331175327301e-05, -6.0614198446273804e-05, -5.32250851392746e-05, -4.583597183227539e-05, -3.8446858525276184e-05, -3.105774521827698e-05, -2.366863191127777e-05, -1.6279518604278564e-05, -8.890405297279358e-06, -1.5012919902801514e-06, 5.887821316719055e-06, 1.3276934623718262e-05, 2.0666047930717468e-05, 2.8055161237716675e-05, 3.544427454471588e-05, 4.283338785171509e-05, 5.0222501158714294e-05, 5.76116144657135e-05, 6.500072777271271e-05, 7.238984107971191e-05, 7.977895438671112e-05, 8.716806769371033e-05, 9.455718100070953e-05, 0.00010194629430770874, 0.00010933540761470795, 0.00011672452092170715, 0.00012411363422870636, 0.00013150274753570557, 0.00013889186084270477, 0.00014628097414970398, 0.00015367008745670319, 0.0001610592007637024, 0.0001684483140707016, 0.0001758374273777008, 0.0001832265406847, 0.00019061565399169922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 15.0, 33.0, 61.0, 92.0, 195.0, 476.0, 1209.0, 4130.0, 47458.0, 949587.0, 39361.0, 3872.0, 1177.0, 478.0, 195.0, 106.0, 43.0, 18.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.064453125, -2.9700927734375, -2.875732421875, -2.7813720703125, -2.68701171875, -2.5926513671875, -2.498291015625, -2.4039306640625, -2.3095703125, -2.2152099609375, -2.120849609375, -2.0264892578125, -1.93212890625, -1.8377685546875, -1.743408203125, -1.6490478515625, -1.5546875, -1.4603271484375, -1.365966796875, -1.2716064453125, -1.17724609375, -1.0828857421875, -0.988525390625, -0.8941650390625, -0.7998046875, -0.7054443359375, -0.611083984375, -0.5167236328125, -0.42236328125, -0.3280029296875, -0.233642578125, -0.1392822265625, -0.044921875, 0.0494384765625, 0.143798828125, 0.2381591796875, 0.33251953125, 0.4268798828125, 0.521240234375, 0.6156005859375, 0.7099609375, 0.8043212890625, 0.898681640625, 0.9930419921875, 1.08740234375, 1.1817626953125, 1.276123046875, 1.3704833984375, 1.46484375, 1.5592041015625, 1.653564453125, 1.7479248046875, 1.84228515625, 1.9366455078125, 2.031005859375, 2.1253662109375, 2.2197265625, 2.3140869140625, 2.408447265625, 2.5028076171875, 2.59716796875, 2.6915283203125, 2.785888671875, 2.8802490234375, 2.974609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 13.0, 11.0, 22.0, 62.0, 108.0, 220.0, 252.0, 143.0, 74.0, 35.0, 19.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.513671875, -2.413848876953125, -2.31402587890625, -2.214202880859375, -2.1143798828125, -2.014556884765625, -1.91473388671875, -1.814910888671875, -1.715087890625, -1.615264892578125, -1.51544189453125, -1.415618896484375, -1.3157958984375, -1.215972900390625, -1.11614990234375, -1.016326904296875, -0.91650390625, -0.816680908203125, -0.71685791015625, -0.617034912109375, -0.5172119140625, -0.417388916015625, -0.31756591796875, -0.217742919921875, -0.117919921875, -0.018096923828125, 0.08172607421875, 0.181549072265625, 0.2813720703125, 0.381195068359375, 0.48101806640625, 0.580841064453125, 0.6806640625, 0.780487060546875, 0.88031005859375, 0.980133056640625, 1.0799560546875, 1.179779052734375, 1.27960205078125, 1.379425048828125, 1.479248046875, 1.579071044921875, 1.67889404296875, 1.778717041015625, 1.8785400390625, 1.978363037109375, 2.07818603515625, 2.178009033203125, 2.27783203125, 2.377655029296875, 2.47747802734375, 2.577301025390625, 2.6771240234375, 2.776947021484375, 2.87677001953125, 2.976593017578125, 3.076416015625, 3.176239013671875, 3.27606201171875, 3.375885009765625, 3.4757080078125, 3.575531005859375, 3.67535400390625, 3.775177001953125, 3.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 17.0, 16.0, 32.0, 26.0, 44.0, 53.0, 51.0, 68.0, 95.0, 115.0, 91.0, 72.0, 54.0, 69.0, 51.0, 42.0, 16.0, 20.0, 22.0, 7.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.282142639160156, -16.755569458007812, -16.2289981842041, -15.702425003051758, -15.17585277557373, -14.649280548095703, -14.12270736694336, -13.596135139465332, -13.069562911987305, -12.542990684509277, -12.016417503356934, -11.489845275878906, -10.963273048400879, -10.436700820922852, -9.910127639770508, -9.38355541229248, -8.856982231140137, -8.33041000366211, -7.803837299346924, -7.277264595031738, -6.750692367553711, -6.224119663238525, -5.69754695892334, -5.1709747314453125, -4.644402027130127, -4.117829322814941, -3.591257095336914, -3.0646843910217285, -2.538111925125122, -2.0115394592285156, -1.48496675491333, -0.9583942890167236, -0.4318218231201172, 0.09475070238113403, 0.6213232278823853, 1.1478958129882812, 1.6744682788848877, 2.201040744781494, 2.7276134490966797, 3.254185914993286, 3.7807583808898926, 4.307331085205078, 4.8339033126831055, 5.360476016998291, 5.887048721313477, 6.413620948791504, 6.9401936531066895, 7.466766357421875, 7.993338584899902, 8.51991081237793, 9.046483993530273, 9.5730562210083, 10.099628448486328, 10.626201629638672, 11.1527738571167, 11.679346084594727, 12.20591926574707, 12.732491493225098, 13.259064674377441, 13.785636901855469, 14.312209129333496, 14.838781356811523, 15.365354537963867, 15.891926765441895, 16.418498992919922]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 10.0, 7.0, 10.0, 8.0, 12.0, 10.0, 20.0, 18.0, 31.0, 25.0, 36.0, 38.0, 44.0, 36.0, 49.0, 53.0, 44.0, 60.0, 35.0, 45.0, 37.0, 48.0, 33.0, 24.0, 33.0, 32.0, 30.0, 24.0, 21.0, 17.0, 21.0, 12.0, 12.0, 6.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.726259231567383, -17.16609001159668, -16.605920791625977, -16.045751571655273, -15.485581398010254, -14.92541217803955, -14.365242004394531, -13.805072784423828, -13.244903564453125, -12.684734344482422, -12.124565124511719, -11.5643949508667, -11.004225730895996, -10.444056510925293, -9.883886337280273, -9.32371711730957, -8.763547897338867, -8.203378677368164, -7.643208980560303, -7.083039283752441, -6.522870063781738, -5.962700843811035, -5.402531147003174, -4.8423614501953125, -4.282192230224609, -3.722022771835327, -3.161853313446045, -2.6016838550567627, -2.0415143966674805, -1.4813449382781982, -0.921175479888916, -0.3610060214996338, 0.19916534423828125, 0.7593348026275635, 1.3195042610168457, 1.879673719406128, 2.43984317779541, 3.0000126361846924, 3.5601820945739746, 4.120351791381836, 4.680521011352539, 5.240690231323242, 5.8008599281311035, 6.361029624938965, 6.921198844909668, 7.481368064880371, 8.04153823852539, 8.601707458496094, 9.161876678466797, 9.7220458984375, 10.282215118408203, 10.842385292053223, 11.402554512023926, 11.962723731994629, 12.522893905639648, 13.083063125610352, 13.643232345581055, 14.203401565551758, 14.763570785522461, 15.32374095916748, 15.883910179138184, 16.444080352783203, 17.004249572753906, 17.56441879272461, 18.124588012695312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 7.0, 8.0, 21.0, 24.0, 53.0, 55.0, 83.0, 160.0, 178.0, 300.0, 524.0, 966.0, 2013.0, 5072.0, 16349.0, 111334.0, 4005365.0, 36108.0, 8989.0, 3228.0, 1409.0, 726.0, 404.0, 306.0, 191.0, 132.0, 70.0, 53.0, 44.0, 19.0, 20.0, 14.0, 16.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.974517822265625, -2.87286376953125, -2.771209716796875, -2.6695556640625, -2.567901611328125, -2.46624755859375, -2.364593505859375, -2.262939453125, -2.161285400390625, -2.05963134765625, -1.957977294921875, -1.8563232421875, -1.754669189453125, -1.65301513671875, -1.551361083984375, -1.44970703125, -1.348052978515625, -1.24639892578125, -1.144744873046875, -1.0430908203125, -0.941436767578125, -0.83978271484375, -0.738128662109375, -0.636474609375, -0.534820556640625, -0.43316650390625, -0.331512451171875, -0.2298583984375, -0.128204345703125, -0.02655029296875, 0.075103759765625, 0.1767578125, 0.278411865234375, 0.38006591796875, 0.481719970703125, 0.5833740234375, 0.685028076171875, 0.78668212890625, 0.888336181640625, 0.989990234375, 1.091644287109375, 1.19329833984375, 1.294952392578125, 1.3966064453125, 1.498260498046875, 1.59991455078125, 1.701568603515625, 1.80322265625, 1.904876708984375, 2.00653076171875, 2.108184814453125, 2.2098388671875, 2.311492919921875, 2.41314697265625, 2.514801025390625, 2.616455078125, 2.718109130859375, 2.81976318359375, 2.921417236328125, 3.0230712890625, 3.124725341796875, 3.22637939453125, 3.328033447265625, 3.4296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 17.0, 18.0, 20.0, 32.0, 44.0, 51.0, 70.0, 62.0, 64.0, 64.0, 57.0, 78.0, 62.0, 51.0, 47.0, 52.0, 39.0, 35.0, 18.0, 18.0, 19.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.939422607421875, -0.90716552734375, -0.874908447265625, -0.8426513671875, -0.810394287109375, -0.77813720703125, -0.745880126953125, -0.713623046875, -0.681365966796875, -0.64910888671875, -0.616851806640625, -0.5845947265625, -0.552337646484375, -0.52008056640625, -0.487823486328125, -0.45556640625, -0.423309326171875, -0.39105224609375, -0.358795166015625, -0.3265380859375, -0.294281005859375, -0.26202392578125, -0.229766845703125, -0.197509765625, -0.165252685546875, -0.13299560546875, -0.100738525390625, -0.0684814453125, -0.036224365234375, -0.00396728515625, 0.028289794921875, 0.060546875, 0.092803955078125, 0.12506103515625, 0.157318115234375, 0.1895751953125, 0.221832275390625, 0.25408935546875, 0.286346435546875, 0.318603515625, 0.350860595703125, 0.38311767578125, 0.415374755859375, 0.4476318359375, 0.479888916015625, 0.51214599609375, 0.544403076171875, 0.57666015625, 0.608917236328125, 0.64117431640625, 0.673431396484375, 0.7056884765625, 0.737945556640625, 0.77020263671875, 0.802459716796875, 0.834716796875, 0.866973876953125, 0.89923095703125, 0.931488037109375, 0.9637451171875, 0.996002197265625, 1.02825927734375, 1.060516357421875, 1.0927734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 15.0, 10.0, 10.0, 19.0, 25.0, 33.0, 46.0, 75.0, 99.0, 139.0, 182.0, 253.0, 383.0, 682.0, 1146.0, 2166.0, 4221.0, 9329.0, 24707.0, 98071.0, 3856366.0, 144230.0, 30360.0, 10957.0, 4788.0, 2463.0, 1261.0, 769.0, 424.0, 319.0, 205.0, 149.0, 98.0, 79.0, 44.0, 31.0, 28.0, 20.0, 18.0, 17.0, 9.0, 2.0, 8.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0], "bins": [-2.833984375, -2.754364013671875, -2.67474365234375, -2.595123291015625, -2.5155029296875, -2.435882568359375, -2.35626220703125, -2.276641845703125, -2.197021484375, -2.117401123046875, -2.03778076171875, -1.958160400390625, -1.8785400390625, -1.798919677734375, -1.71929931640625, -1.639678955078125, -1.56005859375, -1.480438232421875, -1.40081787109375, -1.321197509765625, -1.2415771484375, -1.161956787109375, -1.08233642578125, -1.002716064453125, -0.923095703125, -0.843475341796875, -0.76385498046875, -0.684234619140625, -0.6046142578125, -0.524993896484375, -0.44537353515625, -0.365753173828125, -0.2861328125, -0.206512451171875, -0.12689208984375, -0.047271728515625, 0.0323486328125, 0.111968994140625, 0.19158935546875, 0.271209716796875, 0.350830078125, 0.430450439453125, 0.51007080078125, 0.589691162109375, 0.6693115234375, 0.748931884765625, 0.82855224609375, 0.908172607421875, 0.98779296875, 1.067413330078125, 1.14703369140625, 1.226654052734375, 1.3062744140625, 1.385894775390625, 1.46551513671875, 1.545135498046875, 1.624755859375, 1.704376220703125, 1.78399658203125, 1.863616943359375, 1.9432373046875, 2.022857666015625, 2.10247802734375, 2.182098388671875, 2.26171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 23.0, 45.0, 48.0, 156.0, 3257.0, 314.0, 84.0, 45.0, 28.0, 18.0, 7.0, 9.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1884002685546875, -1.156097412109375, -1.1237945556640625, -1.09149169921875, -1.0591888427734375, -1.026885986328125, -0.9945831298828125, -0.9622802734375, -0.9299774169921875, -0.897674560546875, -0.8653717041015625, -0.83306884765625, -0.8007659912109375, -0.768463134765625, -0.7361602783203125, -0.703857421875, -0.6715545654296875, -0.639251708984375, -0.6069488525390625, -0.57464599609375, -0.5423431396484375, -0.510040283203125, -0.4777374267578125, -0.4454345703125, -0.4131317138671875, -0.380828857421875, -0.3485260009765625, -0.31622314453125, -0.2839202880859375, -0.251617431640625, -0.2193145751953125, -0.18701171875, -0.1547088623046875, -0.122406005859375, -0.0901031494140625, -0.05780029296875, -0.0254974365234375, 0.006805419921875, 0.0391082763671875, 0.0714111328125, 0.1037139892578125, 0.136016845703125, 0.1683197021484375, 0.20062255859375, 0.2329254150390625, 0.265228271484375, 0.2975311279296875, 0.329833984375, 0.3621368408203125, 0.394439697265625, 0.4267425537109375, 0.45904541015625, 0.4913482666015625, 0.523651123046875, 0.5559539794921875, 0.5882568359375, 0.6205596923828125, 0.652862548828125, 0.6851654052734375, 0.71746826171875, 0.7497711181640625, 0.782073974609375, 0.8143768310546875, 0.8466796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 7.0, 13.0, 21.0, 37.0, 53.0, 54.0, 78.0, 92.0, 111.0, 98.0, 114.0, 97.0, 73.0, 60.0, 42.0, 12.0, 20.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5895838737487793, -3.4941811561584473, -3.398778200149536, -3.303375482559204, -3.207972526550293, -3.112569808959961, -3.017167091369629, -2.9217641353607178, -2.8263611793518066, -2.7309584617614746, -2.6355555057525635, -2.5401527881622314, -2.4447498321533203, -2.3493471145629883, -2.2539443969726562, -2.158541440963745, -2.063138723373413, -1.9677358865737915, -1.87233304977417, -1.776930332183838, -1.6815273761749268, -1.5861246585845947, -1.4907218217849731, -1.3953189849853516, -1.29991614818573, -1.2045133113861084, -1.1091104745864868, -1.0137076377868652, -0.9183048605918884, -0.8229020237922668, -0.72749924659729, -0.6320964097976685, -0.5366935729980469, -0.4412907361984253, -0.3458879292011261, -0.2504851222038269, -0.15508228540420532, -0.05967944860458374, 0.035723328590393066, 0.13112616539001465, 0.22652900218963623, 0.3219318389892578, 0.417334645986557, 0.5127374529838562, 0.6081402897834778, 0.7035431265830994, 0.7989459037780762, 0.8943487405776978, 0.9897515773773193, 1.085154414176941, 1.1805572509765625, 1.2759599685668945, 1.3713629245758057, 1.4667656421661377, 1.5621684789657593, 1.6575713157653809, 1.7529741525650024, 1.848376989364624, 1.9437798261642456, 2.039182662963867, 2.134585380554199, 2.2299883365631104, 2.3253910541534424, 2.4207940101623535, 2.5161967277526855]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 22.0, 14.0, 28.0, 26.0, 26.0, 23.0, 32.0, 40.0, 32.0, 32.0, 45.0, 43.0, 40.0, 50.0, 46.0, 56.0, 40.0, 34.0, 55.0, 51.0, 36.0, 35.0, 29.0, 18.0, 23.0, 17.0, 19.0, 9.0, 7.0, 10.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9960172176361084, -1.9374629259109497, -1.8789085149765015, -1.8203542232513428, -1.761799931526184, -1.7032456398010254, -1.6446912288665771, -1.5861369371414185, -1.5275826454162598, -1.469028353691101, -1.4104739427566528, -1.3519196510314941, -1.2933653593063354, -1.2348110675811768, -1.1762566566467285, -1.1177023649215698, -1.0591480731964111, -1.0005937814712524, -0.942039430141449, -0.8834850788116455, -0.8249307870864868, -0.7663764357566833, -0.7078220844268799, -0.6492677927017212, -0.590713381767273, -0.5321590304374695, -0.4736047387123108, -0.4150503873825073, -0.35649609565734863, -0.29794174432754517, -0.2393874228000641, -0.180833101272583, -0.12227880954742432, -0.06372448801994324, -0.005170159041881561, 0.053384169936180115, 0.1119384914636612, 0.17049282789230347, 0.22904714941978455, 0.2876014709472656, 0.3461557924747467, 0.4047101140022278, 0.46326443552970886, 0.5218187570571899, 0.5803731083869934, 0.6389274597167969, 0.6974817514419556, 0.7560360431671143, 0.8145903944969177, 0.8731447458267212, 0.9316990375518799, 0.9902533888816833, 1.0488077402114868, 1.1073620319366455, 1.1659163236618042, 1.224470615386963, 1.2830250263214111, 1.3415793180465698, 1.400133728981018, 1.4586880207061768, 1.5172423124313354, 1.5757966041564941, 1.6343510150909424, 1.692905306816101, 1.7514595985412598]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 17.0, 25.0, 42.0, 62.0, 69.0, 117.0, 172.0, 282.0, 449.0, 777.0, 1381.0, 2470.0, 4807.0, 10066.0, 22641.0, 56024.0, 140962.0, 288561.0, 283734.0, 138478.0, 54614.0, 22130.0, 9854.0, 4856.0, 2541.0, 1359.0, 757.0, 455.0, 291.0, 175.0, 122.0, 92.0, 45.0, 46.0, 17.0, 14.0, 13.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6358795166015625, -1.581329345703125, -1.5267791748046875, -1.47222900390625, -1.4176788330078125, -1.363128662109375, -1.3085784912109375, -1.2540283203125, -1.1994781494140625, -1.144927978515625, -1.0903778076171875, -1.03582763671875, -0.9812774658203125, -0.926727294921875, -0.8721771240234375, -0.817626953125, -0.7630767822265625, -0.708526611328125, -0.6539764404296875, -0.59942626953125, -0.5448760986328125, -0.490325927734375, -0.4357757568359375, -0.3812255859375, -0.3266754150390625, -0.272125244140625, -0.2175750732421875, -0.16302490234375, -0.1084747314453125, -0.053924560546875, 0.0006256103515625, 0.05517578125, 0.1097259521484375, 0.164276123046875, 0.2188262939453125, 0.27337646484375, 0.3279266357421875, 0.382476806640625, 0.4370269775390625, 0.4915771484375, 0.5461273193359375, 0.600677490234375, 0.6552276611328125, 0.70977783203125, 0.7643280029296875, 0.818878173828125, 0.8734283447265625, 0.927978515625, 0.9825286865234375, 1.037078857421875, 1.0916290283203125, 1.14617919921875, 1.2007293701171875, 1.255279541015625, 1.3098297119140625, 1.3643798828125, 1.4189300537109375, 1.473480224609375, 1.5280303955078125, 1.58258056640625, 1.6371307373046875, 1.691680908203125, 1.7462310791015625, 1.80078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 7.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 28.0, 34.0, 37.0, 42.0, 50.0, 55.0, 47.0, 65.0, 65.0, 67.0, 54.0, 53.0, 49.0, 46.0, 41.0, 42.0, 24.0, 32.0, 22.0, 16.0, 11.0, 9.0, 13.0, 3.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.013671875, -0.9827423095703125, -0.951812744140625, -0.9208831787109375, -0.88995361328125, -0.8590240478515625, -0.828094482421875, -0.7971649169921875, -0.7662353515625, -0.7353057861328125, -0.704376220703125, -0.6734466552734375, -0.64251708984375, -0.6115875244140625, -0.580657958984375, -0.5497283935546875, -0.518798828125, -0.4878692626953125, -0.456939697265625, -0.4260101318359375, -0.39508056640625, -0.3641510009765625, -0.333221435546875, -0.3022918701171875, -0.2713623046875, -0.2404327392578125, -0.209503173828125, -0.1785736083984375, -0.14764404296875, -0.1167144775390625, -0.085784912109375, -0.0548553466796875, -0.02392578125, 0.0070037841796875, 0.037933349609375, 0.0688629150390625, 0.09979248046875, 0.1307220458984375, 0.161651611328125, 0.1925811767578125, 0.2235107421875, 0.2544403076171875, 0.285369873046875, 0.3162994384765625, 0.34722900390625, 0.3781585693359375, 0.409088134765625, 0.4400177001953125, 0.470947265625, 0.5018768310546875, 0.532806396484375, 0.5637359619140625, 0.59466552734375, 0.6255950927734375, 0.656524658203125, 0.6874542236328125, 0.7183837890625, 0.7493133544921875, 0.780242919921875, 0.8111724853515625, 0.84210205078125, 0.8730316162109375, 0.903961181640625, 0.9348907470703125, 0.9658203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 8.0, 14.0, 12.0, 18.0, 30.0, 44.0, 83.0, 136.0, 235.0, 446.0, 849.0, 2099.0, 5715.0, 21016.0, 114378.0, 597073.0, 252189.0, 39528.0, 9219.0, 2959.0, 1261.0, 565.0, 261.0, 135.0, 96.0, 46.0, 35.0, 22.0, 21.0, 18.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.89453125, -3.791229248046875, -3.68792724609375, -3.584625244140625, -3.4813232421875, -3.378021240234375, -3.27471923828125, -3.171417236328125, -3.068115234375, -2.964813232421875, -2.86151123046875, -2.758209228515625, -2.6549072265625, -2.551605224609375, -2.44830322265625, -2.345001220703125, -2.24169921875, -2.138397216796875, -2.03509521484375, -1.931793212890625, -1.8284912109375, -1.725189208984375, -1.62188720703125, -1.518585205078125, -1.415283203125, -1.311981201171875, -1.20867919921875, -1.105377197265625, -1.0020751953125, -0.898773193359375, -0.79547119140625, -0.692169189453125, -0.5888671875, -0.485565185546875, -0.38226318359375, -0.278961181640625, -0.1756591796875, -0.072357177734375, 0.03094482421875, 0.134246826171875, 0.237548828125, 0.340850830078125, 0.44415283203125, 0.547454833984375, 0.6507568359375, 0.754058837890625, 0.85736083984375, 0.960662841796875, 1.06396484375, 1.167266845703125, 1.27056884765625, 1.373870849609375, 1.4771728515625, 1.580474853515625, 1.68377685546875, 1.787078857421875, 1.890380859375, 1.993682861328125, 2.09698486328125, 2.200286865234375, 2.3035888671875, 2.406890869140625, 2.51019287109375, 2.613494873046875, 2.716796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 19.0, 33.0, 29.0, 39.0, 44.0, 64.0, 60.0, 56.0, 77.0, 72.0, 65.0, 68.0, 58.0, 50.0, 39.0, 34.0, 33.0, 27.0, 12.0, 16.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.61956787109375, -5.4500732421875, -5.28057861328125, -5.111083984375, -4.94158935546875, -4.7720947265625, -4.60260009765625, -4.43310546875, -4.26361083984375, -4.0941162109375, -3.92462158203125, -3.755126953125, -3.58563232421875, -3.4161376953125, -3.24664306640625, -3.0771484375, -2.90765380859375, -2.7381591796875, -2.56866455078125, -2.399169921875, -2.22967529296875, -2.0601806640625, -1.89068603515625, -1.72119140625, -1.55169677734375, -1.3822021484375, -1.21270751953125, -1.043212890625, -0.87371826171875, -0.7042236328125, -0.53472900390625, -0.365234375, -0.19573974609375, -0.0262451171875, 0.14324951171875, 0.312744140625, 0.48223876953125, 0.6517333984375, 0.82122802734375, 0.99072265625, 1.16021728515625, 1.3297119140625, 1.49920654296875, 1.668701171875, 1.83819580078125, 2.0076904296875, 2.17718505859375, 2.3466796875, 2.51617431640625, 2.6856689453125, 2.85516357421875, 3.024658203125, 3.19415283203125, 3.3636474609375, 3.53314208984375, 3.70263671875, 3.87213134765625, 4.0416259765625, 4.21112060546875, 4.380615234375, 4.55010986328125, 4.7196044921875, 4.88909912109375, 5.05859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 16.0, 44.0, 49.0, 130.0, 250.0, 764.0, 2911.0, 26775.0, 885850.0, 123724.0, 6099.0, 1259.0, 376.0, 146.0, 70.0, 32.0, 24.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.4852294921875, -3.378662109375, -3.2720947265625, -3.16552734375, -3.0589599609375, -2.952392578125, -2.8458251953125, -2.7392578125, -2.6326904296875, -2.526123046875, -2.4195556640625, -2.31298828125, -2.2064208984375, -2.099853515625, -1.9932861328125, -1.88671875, -1.7801513671875, -1.673583984375, -1.5670166015625, -1.46044921875, -1.3538818359375, -1.247314453125, -1.1407470703125, -1.0341796875, -0.9276123046875, -0.821044921875, -0.7144775390625, -0.60791015625, -0.5013427734375, -0.394775390625, -0.2882080078125, -0.181640625, -0.0750732421875, 0.031494140625, 0.1380615234375, 0.24462890625, 0.3511962890625, 0.457763671875, 0.5643310546875, 0.6708984375, 0.7774658203125, 0.884033203125, 0.9906005859375, 1.09716796875, 1.2037353515625, 1.310302734375, 1.4168701171875, 1.5234375, 1.6300048828125, 1.736572265625, 1.8431396484375, 1.94970703125, 2.0562744140625, 2.162841796875, 2.2694091796875, 2.3759765625, 2.4825439453125, 2.589111328125, 2.6956787109375, 2.80224609375, 2.9088134765625, 3.015380859375, 3.1219482421875, 3.228515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 16.0, 20.0, 27.0, 34.0, 58.0, 77.0, 115.0, 125.0, 110.0, 112.0, 80.0, 59.0, 50.0, 34.0, 19.0, 11.0, 7.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002899169921875, -0.0002820640802383423, -0.00027421116828918457, -0.00026635825634002686, -0.00025850534439086914, -0.0002506524324417114, -0.0002427995204925537, -0.000234946608543396, -0.00022709369659423828, -0.00021924078464508057, -0.00021138787269592285, -0.00020353496074676514, -0.00019568204879760742, -0.0001878291368484497, -0.000179976224899292, -0.00017212331295013428, -0.00016427040100097656, -0.00015641748905181885, -0.00014856457710266113, -0.00014071166515350342, -0.0001328587532043457, -0.000125005841255188, -0.00011715292930603027, -0.00010930001735687256, -0.00010144710540771484, -9.359419345855713e-05, -8.574128150939941e-05, -7.78883695602417e-05, -7.003545761108398e-05, -6.218254566192627e-05, -5.4329633712768555e-05, -4.647672176361084e-05, -3.8623809814453125e-05, -3.077089786529541e-05, -2.2917985916137695e-05, -1.506507396697998e-05, -7.212162017822266e-06, 6.407499313354492e-07, 8.493661880493164e-06, 1.634657382965088e-05, 2.4199485778808594e-05, 3.205239772796631e-05, 3.9905309677124023e-05, 4.775822162628174e-05, 5.561113357543945e-05, 6.346404552459717e-05, 7.131695747375488e-05, 7.91698694229126e-05, 8.702278137207031e-05, 9.487569332122803e-05, 0.00010272860527038574, 0.00011058151721954346, 0.00011843442916870117, 0.0001262873411178589, 0.0001341402530670166, 0.00014199316501617432, 0.00014984607696533203, 0.00015769898891448975, 0.00016555190086364746, 0.00017340481281280518, 0.0001812577247619629, 0.0001891106367111206, 0.00019696354866027832, 0.00020481646060943604, 0.00021266937255859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 19.0, 39.0, 74.0, 129.0, 281.0, 670.0, 2086.0, 13223.0, 422643.0, 588630.0, 16800.0, 2527.0, 727.0, 293.0, 146.0, 84.0, 68.0, 23.0, 18.0, 18.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.388763427734375, -2.29705810546875, -2.205352783203125, -2.1136474609375, -2.021942138671875, -1.93023681640625, -1.838531494140625, -1.746826171875, -1.655120849609375, -1.56341552734375, -1.471710205078125, -1.3800048828125, -1.288299560546875, -1.19659423828125, -1.104888916015625, -1.01318359375, -0.921478271484375, -0.82977294921875, -0.738067626953125, -0.6463623046875, -0.554656982421875, -0.46295166015625, -0.371246337890625, -0.279541015625, -0.187835693359375, -0.09613037109375, -0.004425048828125, 0.0872802734375, 0.178985595703125, 0.27069091796875, 0.362396240234375, 0.4541015625, 0.545806884765625, 0.63751220703125, 0.729217529296875, 0.8209228515625, 0.912628173828125, 1.00433349609375, 1.096038818359375, 1.187744140625, 1.279449462890625, 1.37115478515625, 1.462860107421875, 1.5545654296875, 1.646270751953125, 1.73797607421875, 1.829681396484375, 1.92138671875, 2.013092041015625, 2.10479736328125, 2.196502685546875, 2.2882080078125, 2.379913330078125, 2.47161865234375, 2.563323974609375, 2.655029296875, 2.746734619140625, 2.83843994140625, 2.930145263671875, 3.0218505859375, 3.113555908203125, 3.20526123046875, 3.296966552734375, 3.388671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 11.0, 23.0, 66.0, 116.0, 190.0, 215.0, 177.0, 111.0, 39.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.3228759765625, -2.196533203125, -2.0701904296875, -1.94384765625, -1.8175048828125, -1.691162109375, -1.5648193359375, -1.4384765625, -1.3121337890625, -1.185791015625, -1.0594482421875, -0.93310546875, -0.8067626953125, -0.680419921875, -0.5540771484375, -0.427734375, -0.3013916015625, -0.175048828125, -0.0487060546875, 0.07763671875, 0.2039794921875, 0.330322265625, 0.4566650390625, 0.5830078125, 0.7093505859375, 0.835693359375, 0.9620361328125, 1.08837890625, 1.2147216796875, 1.341064453125, 1.4674072265625, 1.59375, 1.7200927734375, 1.846435546875, 1.9727783203125, 2.09912109375, 2.2254638671875, 2.351806640625, 2.4781494140625, 2.6044921875, 2.7308349609375, 2.857177734375, 2.9835205078125, 3.10986328125, 3.2362060546875, 3.362548828125, 3.4888916015625, 3.615234375, 3.7415771484375, 3.867919921875, 3.9942626953125, 4.12060546875, 4.2469482421875, 4.373291015625, 4.4996337890625, 4.6259765625, 4.7523193359375, 4.878662109375, 5.0050048828125, 5.13134765625, 5.2576904296875, 5.384033203125, 5.5103759765625, 5.63671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 22.0, 144.0, 469.0, 318.0, 48.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.7418975830078, -159.59458923339844, -156.447265625, -153.29995727539062, -150.1526336669922, -147.0053253173828, -143.85800170898438, -140.710693359375, -137.56338500976562, -134.41607666015625, -131.2687530517578, -128.12144470214844, -124.97412872314453, -121.82681274414062, -118.67949676513672, -115.53218078613281, -112.3848648071289, -109.237548828125, -106.0902328491211, -102.94291687011719, -99.79560852050781, -96.6482925415039, -93.5009765625, -90.3536605834961, -87.20634460449219, -84.05902862548828, -80.91171264648438, -77.764404296875, -74.6170883178711, -71.46977233886719, -68.32245635986328, -65.17514038085938, -62.02782440185547, -58.88050842285156, -55.73319625854492, -52.585880279541016, -49.438568115234375, -46.29125213623047, -43.14393615722656, -39.996620178222656, -36.849308013916016, -33.70199203491211, -30.55467987060547, -27.407363891601562, -24.26004981994629, -21.112735748291016, -17.96541976928711, -14.818105697631836, -11.670791625976562, -8.523477554321289, -5.376162528991699, -2.2288475036621094, 0.9184665679931641, 4.0657806396484375, 7.213096618652344, 10.360410690307617, 13.50772476196289, 16.655038833618164, 19.802352905273438, 22.949668884277344, 26.096982955932617, 29.24429702758789, 32.3916130065918, 35.53892517089844, 38.686241149902344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 6.0, 16.0, 16.0, 14.0, 22.0, 19.0, 11.0, 22.0, 30.0, 33.0, 40.0, 45.0, 48.0, 58.0, 50.0, 48.0, 51.0, 53.0, 47.0, 52.0, 41.0, 38.0, 45.0, 24.0, 31.0, 21.0, 19.0, 19.0, 17.0, 10.0, 10.0, 5.0, 4.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.56472396850586, -15.96933650970459, -15.373950004577637, -14.778562545776367, -14.183176040649414, -13.587788581848145, -12.992401123046875, -12.397014617919922, -11.801627159118652, -11.206239700317383, -10.61085319519043, -10.01546573638916, -9.42007827758789, -8.824691772460938, -8.229304313659668, -7.633917331695557, -7.038530349731445, -6.443143367767334, -5.847756385803223, -5.252368927001953, -4.656981945037842, -4.0615949630737305, -3.46620774269104, -2.8708205223083496, -2.2754335403442383, -1.6800464391708374, -1.0846593379974365, -0.48927223682403564, 0.10611486434936523, 0.7015018463134766, 1.296889066696167, 1.8922762870788574, 2.4876632690429688, 3.08305025100708, 3.6784374713897705, 4.273824691772461, 4.869211673736572, 5.464598655700684, 6.059986114501953, 6.6553730964660645, 7.250760078430176, 7.846147060394287, 8.441534042358398, 9.036921501159668, 9.632308959960938, 10.22769546508789, 10.82308292388916, 11.41847038269043, 12.013856887817383, 12.609244346618652, 13.204630851745605, 13.800018310546875, 14.395404815673828, 14.990792274475098, 15.586179733276367, 16.18156623840332, 16.776954650878906, 17.37234115600586, 17.967729568481445, 18.5631160736084, 19.15850257873535, 19.753890991210938, 20.34927749633789, 20.944664001464844, 21.540050506591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 23.0, 30.0, 40.0, 65.0, 73.0, 138.0, 194.0, 369.0, 730.0, 1420.0, 3324.0, 9262.0, 49579.0, 4093969.0, 23942.0, 6153.0, 2393.0, 1069.0, 602.0, 322.0, 194.0, 120.0, 71.0, 63.0, 31.0, 22.0, 9.0, 13.0, 9.0, 10.0, 2.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.61883544921875, -4.4759521484375, -4.33306884765625, -4.190185546875, -4.04730224609375, -3.9044189453125, -3.76153564453125, -3.61865234375, -3.47576904296875, -3.3328857421875, -3.19000244140625, -3.047119140625, -2.90423583984375, -2.7613525390625, -2.61846923828125, -2.4755859375, -2.33270263671875, -2.1898193359375, -2.04693603515625, -1.904052734375, -1.76116943359375, -1.6182861328125, -1.47540283203125, -1.33251953125, -1.18963623046875, -1.0467529296875, -0.90386962890625, -0.760986328125, -0.61810302734375, -0.4752197265625, -0.33233642578125, -0.189453125, -0.04656982421875, 0.0963134765625, 0.23919677734375, 0.382080078125, 0.52496337890625, 0.6678466796875, 0.81072998046875, 0.95361328125, 1.09649658203125, 1.2393798828125, 1.38226318359375, 1.525146484375, 1.66802978515625, 1.8109130859375, 1.95379638671875, 2.0966796875, 2.23956298828125, 2.3824462890625, 2.52532958984375, 2.668212890625, 2.81109619140625, 2.9539794921875, 3.09686279296875, 3.23974609375, 3.38262939453125, 3.5255126953125, 3.66839599609375, 3.811279296875, 3.95416259765625, 4.0970458984375, 4.23992919921875, 4.3828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 9.0, 20.0, 20.0, 27.0, 32.0, 39.0, 58.0, 53.0, 65.0, 61.0, 62.0, 83.0, 54.0, 68.0, 56.0, 40.0, 41.0, 39.0, 25.0, 35.0, 20.0, 18.0, 13.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9173049926757812, -0.8809967041015625, -0.8446884155273438, -0.808380126953125, -0.7720718383789062, -0.7357635498046875, -0.6994552612304688, -0.66314697265625, -0.6268386840820312, -0.5905303955078125, -0.5542221069335938, -0.517913818359375, -0.48160552978515625, -0.4452972412109375, -0.40898895263671875, -0.3726806640625, -0.33637237548828125, -0.3000640869140625, -0.26375579833984375, -0.227447509765625, -0.19113922119140625, -0.1548309326171875, -0.11852264404296875, -0.08221435546875, -0.04590606689453125, -0.0095977783203125, 0.02671051025390625, 0.063018798828125, 0.09932708740234375, 0.1356353759765625, 0.17194366455078125, 0.208251953125, 0.24456024169921875, 0.2808685302734375, 0.31717681884765625, 0.353485107421875, 0.38979339599609375, 0.4261016845703125, 0.46240997314453125, 0.49871826171875, 0.5350265502929688, 0.5713348388671875, 0.6076431274414062, 0.643951416015625, 0.6802597045898438, 0.7165679931640625, 0.7528762817382812, 0.7891845703125, 0.8254928588867188, 0.8618011474609375, 0.8981094360351562, 0.934417724609375, 0.9707260131835938, 1.0070343017578125, 1.0433425903320312, 1.07965087890625, 1.1159591674804688, 1.1522674560546875, 1.1885757446289062, 1.224884033203125, 1.2611923217773438, 1.2975006103515625, 1.3338088989257812, 1.3701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 11.0, 11.0, 14.0, 34.0, 46.0, 52.0, 87.0, 118.0, 159.0, 269.0, 364.0, 598.0, 925.0, 1679.0, 3008.0, 6455.0, 16747.0, 84031.0, 4020331.0, 37538.0, 10906.0, 4760.0, 2367.0, 1349.0, 793.0, 513.0, 323.0, 216.0, 155.0, 106.0, 80.0, 46.0, 43.0, 27.0, 23.0, 16.0, 10.0, 14.0, 8.0, 4.0, 7.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89111328125, -3.7626953125, -3.63427734375, -3.505859375, -3.37744140625, -3.2490234375, -3.12060546875, -2.9921875, -2.86376953125, -2.7353515625, -2.60693359375, -2.478515625, -2.35009765625, -2.2216796875, -2.09326171875, -1.96484375, -1.83642578125, -1.7080078125, -1.57958984375, -1.451171875, -1.32275390625, -1.1943359375, -1.06591796875, -0.9375, -0.80908203125, -0.6806640625, -0.55224609375, -0.423828125, -0.29541015625, -0.1669921875, -0.03857421875, 0.08984375, 0.21826171875, 0.3466796875, 0.47509765625, 0.603515625, 0.73193359375, 0.8603515625, 0.98876953125, 1.1171875, 1.24560546875, 1.3740234375, 1.50244140625, 1.630859375, 1.75927734375, 1.8876953125, 2.01611328125, 2.14453125, 2.27294921875, 2.4013671875, 2.52978515625, 2.658203125, 2.78662109375, 2.9150390625, 3.04345703125, 3.171875, 3.30029296875, 3.4287109375, 3.55712890625, 3.685546875, 3.81396484375, 3.9423828125, 4.07080078125, 4.19921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 5.0, 11.0, 18.0, 19.0, 29.0, 52.0, 341.0, 3439.0, 56.0, 32.0, 22.0, 8.0, 7.0, 4.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9632034301757812, -0.9288482666015625, -0.8944931030273438, -0.860137939453125, -0.8257827758789062, -0.7914276123046875, -0.7570724487304688, -0.72271728515625, -0.6883621215820312, -0.6540069580078125, -0.6196517944335938, -0.585296630859375, -0.5509414672851562, -0.5165863037109375, -0.48223114013671875, -0.4478759765625, -0.41352081298828125, -0.3791656494140625, -0.34481048583984375, -0.310455322265625, -0.27610015869140625, -0.2417449951171875, -0.20738983154296875, -0.17303466796875, -0.13867950439453125, -0.1043243408203125, -0.06996917724609375, -0.035614013671875, -0.00125885009765625, 0.0330963134765625, 0.06745147705078125, 0.101806640625, 0.13616180419921875, 0.1705169677734375, 0.20487213134765625, 0.239227294921875, 0.27358245849609375, 0.3079376220703125, 0.34229278564453125, 0.37664794921875, 0.41100311279296875, 0.4453582763671875, 0.47971343994140625, 0.514068603515625, 0.5484237670898438, 0.5827789306640625, 0.6171340942382812, 0.6514892578125, 0.6858444213867188, 0.7201995849609375, 0.7545547485351562, 0.788909912109375, 0.8232650756835938, 0.8576202392578125, 0.8919754028320312, 0.92633056640625, 0.9606857299804688, 0.9950408935546875, 1.0293960571289062, 1.063751220703125, 1.0981063842773438, 1.1324615478515625, 1.1668167114257812, 1.201171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 21.0, 39.0, 91.0, 206.0, 239.0, 196.0, 105.0, 66.0, 24.0, 14.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39384126663208, -6.150108337402344, -5.906374931335449, -5.662641525268555, -5.418908596038818, -5.175175666809082, -4.9314422607421875, -4.687708854675293, -4.443975925445557, -4.20024299621582, -3.956509590148926, -3.7127764225006104, -3.469043254852295, -3.2253100872039795, -2.981576919555664, -2.7378437519073486, -2.494110584259033, -2.2503774166107178, -2.0066442489624023, -1.762911081314087, -1.5191779136657715, -1.275444746017456, -1.0317115783691406, -0.7879784107208252, -0.5442452430725098, -0.30051207542419434, -0.056778907775878906, 0.18695425987243652, 0.43068742752075195, 0.6744205951690674, 0.9181537628173828, 1.1618869304656982, 1.4056196212768555, 1.649352788925171, 1.8930859565734863, 2.1368191242218018, 2.380552291870117, 2.6242854595184326, 2.868018627166748, 3.1117517948150635, 3.355484962463379, 3.5992181301116943, 3.8429512977600098, 4.086684226989746, 4.330417633056641, 4.574151039123535, 4.8178839683532715, 5.061616897583008, 5.305350303649902, 5.549083709716797, 5.792816638946533, 6.0365495681762695, 6.280282974243164, 6.524016380310059, 6.767749309539795, 7.011482238769531, 7.255215644836426, 7.49894905090332, 7.742681980133057, 7.986414909362793, 8.230148315429688, 8.473881721496582, 8.717615127563477, 8.961347579956055, 9.20508098602295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 6.0, 5.0, 10.0, 15.0, 18.0, 16.0, 14.0, 21.0, 28.0, 28.0, 30.0, 36.0, 35.0, 44.0, 30.0, 46.0, 39.0, 59.0, 41.0, 43.0, 35.0, 48.0, 35.0, 42.0, 33.0, 32.0, 39.0, 31.0, 27.0, 20.0, 13.0, 11.0, 17.0, 7.0, 11.0, 10.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.346281051635742, -2.2719013690948486, -2.197521686553955, -2.1231422424316406, -2.048762559890747, -1.9743828773498535, -1.9000033140182495, -1.8256237506866455, -1.751244068145752, -1.6768643856048584, -1.6024848222732544, -1.5281052589416504, -1.4537255764007568, -1.3793458938598633, -1.3049663305282593, -1.2305867671966553, -1.1562070846557617, -1.0818274021148682, -1.0074478387832642, -0.9330682158470154, -0.8586885929107666, -0.7843089699745178, -0.709929347038269, -0.6355497241020203, -0.5611701011657715, -0.4867904782295227, -0.4124108552932739, -0.33803123235702515, -0.26365160942077637, -0.1892719864845276, -0.11489236354827881, -0.04051274061203003, 0.03386688232421875, 0.10824650526046753, 0.1826261281967163, 0.2570057511329651, 0.33138537406921387, 0.40576499700546265, 0.4801446199417114, 0.5545242428779602, 0.628903865814209, 0.7032834887504578, 0.7776631116867065, 0.8520427346229553, 0.9264223575592041, 1.0008020401000977, 1.0751816034317017, 1.1495611667633057, 1.2239408493041992, 1.2983205318450928, 1.3727000951766968, 1.4470796585083008, 1.5214593410491943, 1.595839023590088, 1.670218586921692, 1.744598150253296, 1.8189778327941895, 1.893357515335083, 1.967737078666687, 2.042116641998291, 2.1164963245391846, 2.190876007080078, 2.2652554512023926, 2.339635133743286, 2.4140148162841797]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 12.0, 16.0, 22.0, 43.0, 64.0, 120.0, 191.0, 319.0, 535.0, 1020.0, 1889.0, 3768.0, 8104.0, 18634.0, 47976.0, 132487.0, 323040.0, 309211.0, 123371.0, 44908.0, 17735.0, 7438.0, 3576.0, 1767.0, 945.0, 581.0, 321.0, 175.0, 99.0, 61.0, 46.0, 26.0, 15.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9080047607421875, -1.844329833984375, -1.7806549072265625, -1.71697998046875, -1.6533050537109375, -1.589630126953125, -1.5259552001953125, -1.4622802734375, -1.3986053466796875, -1.334930419921875, -1.2712554931640625, -1.20758056640625, -1.1439056396484375, -1.080230712890625, -1.0165557861328125, -0.952880859375, -0.8892059326171875, -0.825531005859375, -0.7618560791015625, -0.69818115234375, -0.6345062255859375, -0.570831298828125, -0.5071563720703125, -0.4434814453125, -0.3798065185546875, -0.316131591796875, -0.2524566650390625, -0.18878173828125, -0.1251068115234375, -0.061431884765625, 0.0022430419921875, 0.06591796875, 0.1295928955078125, 0.193267822265625, 0.2569427490234375, 0.32061767578125, 0.3842926025390625, 0.447967529296875, 0.5116424560546875, 0.5753173828125, 0.6389923095703125, 0.702667236328125, 0.7663421630859375, 0.83001708984375, 0.8936920166015625, 0.957366943359375, 1.0210418701171875, 1.084716796875, 1.1483917236328125, 1.212066650390625, 1.2757415771484375, 1.33941650390625, 1.4030914306640625, 1.466766357421875, 1.5304412841796875, 1.5941162109375, 1.6577911376953125, 1.721466064453125, 1.7851409912109375, 1.84881591796875, 1.9124908447265625, 1.976165771484375, 2.0398406982421875, 2.103515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 9.0, 14.0, 16.0, 38.0, 29.0, 28.0, 44.0, 40.0, 45.0, 46.0, 61.0, 49.0, 57.0, 54.0, 62.0, 46.0, 44.0, 31.0, 40.0, 40.0, 34.0, 20.0, 31.0, 21.0, 9.0, 8.0, 15.0, 4.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9202651977539062, -0.8869171142578125, -0.8535690307617188, -0.820220947265625, -0.7868728637695312, -0.7535247802734375, -0.7201766967773438, -0.68682861328125, -0.6534805297851562, -0.6201324462890625, -0.5867843627929688, -0.553436279296875, -0.5200881958007812, -0.4867401123046875, -0.45339202880859375, -0.4200439453125, -0.38669586181640625, -0.3533477783203125, -0.31999969482421875, -0.286651611328125, -0.25330352783203125, -0.2199554443359375, -0.18660736083984375, -0.15325927734375, -0.11991119384765625, -0.0865631103515625, -0.05321502685546875, -0.019866943359375, 0.01348114013671875, 0.0468292236328125, 0.08017730712890625, 0.113525390625, 0.14687347412109375, 0.1802215576171875, 0.21356964111328125, 0.246917724609375, 0.28026580810546875, 0.3136138916015625, 0.34696197509765625, 0.38031005859375, 0.41365814208984375, 0.4470062255859375, 0.48035430908203125, 0.513702392578125, 0.5470504760742188, 0.5803985595703125, 0.6137466430664062, 0.6470947265625, 0.6804428100585938, 0.7137908935546875, 0.7471389770507812, 0.780487060546875, 0.8138351440429688, 0.8471832275390625, 0.8805313110351562, 0.91387939453125, 0.9472274780273438, 0.9805755615234375, 1.0139236450195312, 1.047271728515625, 1.0806198120117188, 1.1139678955078125, 1.1473159790039062, 1.1806640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 7.0, 6.0, 7.0, 15.0, 15.0, 22.0, 38.0, 68.0, 107.0, 187.0, 388.0, 927.0, 2962.0, 13700.0, 104296.0, 716800.0, 181686.0, 21092.0, 4028.0, 1187.0, 456.0, 192.0, 140.0, 71.0, 51.0, 24.0, 18.0, 11.0, 8.0, 10.0, 5.0, 5.0, 5.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89239501953125, -3.7652587890625, -3.63812255859375, -3.510986328125, -3.38385009765625, -3.2567138671875, -3.12957763671875, -3.00244140625, -2.87530517578125, -2.7481689453125, -2.62103271484375, -2.493896484375, -2.36676025390625, -2.2396240234375, -2.11248779296875, -1.9853515625, -1.85821533203125, -1.7310791015625, -1.60394287109375, -1.476806640625, -1.34967041015625, -1.2225341796875, -1.09539794921875, -0.96826171875, -0.84112548828125, -0.7139892578125, -0.58685302734375, -0.459716796875, -0.33258056640625, -0.2054443359375, -0.07830810546875, 0.048828125, 0.17596435546875, 0.3031005859375, 0.43023681640625, 0.557373046875, 0.68450927734375, 0.8116455078125, 0.93878173828125, 1.06591796875, 1.19305419921875, 1.3201904296875, 1.44732666015625, 1.574462890625, 1.70159912109375, 1.8287353515625, 1.95587158203125, 2.0830078125, 2.21014404296875, 2.3372802734375, 2.46441650390625, 2.591552734375, 2.71868896484375, 2.8458251953125, 2.97296142578125, 3.10009765625, 3.22723388671875, 3.3543701171875, 3.48150634765625, 3.608642578125, 3.73577880859375, 3.8629150390625, 3.99005126953125, 4.1171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 11.0, 4.0, 13.0, 13.0, 12.0, 13.0, 20.0, 11.0, 25.0, 27.0, 20.0, 31.0, 34.0, 40.0, 37.0, 37.0, 51.0, 44.0, 39.0, 43.0, 36.0, 36.0, 37.0, 45.0, 40.0, 36.0, 30.0, 27.0, 23.0, 24.0, 15.0, 23.0, 19.0, 14.0, 13.0, 10.0, 7.0, 12.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.046875, -3.93145751953125, -3.8160400390625, -3.70062255859375, -3.585205078125, -3.46978759765625, -3.3543701171875, -3.23895263671875, -3.12353515625, -3.00811767578125, -2.8927001953125, -2.77728271484375, -2.661865234375, -2.54644775390625, -2.4310302734375, -2.31561279296875, -2.2001953125, -2.08477783203125, -1.9693603515625, -1.85394287109375, -1.738525390625, -1.62310791015625, -1.5076904296875, -1.39227294921875, -1.27685546875, -1.16143798828125, -1.0460205078125, -0.93060302734375, -0.815185546875, -0.69976806640625, -0.5843505859375, -0.46893310546875, -0.353515625, -0.23809814453125, -0.1226806640625, -0.00726318359375, 0.108154296875, 0.22357177734375, 0.3389892578125, 0.45440673828125, 0.56982421875, 0.68524169921875, 0.8006591796875, 0.91607666015625, 1.031494140625, 1.14691162109375, 1.2623291015625, 1.37774658203125, 1.4931640625, 1.60858154296875, 1.7239990234375, 1.83941650390625, 1.954833984375, 2.07025146484375, 2.1856689453125, 2.30108642578125, 2.41650390625, 2.53192138671875, 2.6473388671875, 2.76275634765625, 2.878173828125, 2.99359130859375, 3.1090087890625, 3.22442626953125, 3.33984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 22.0, 51.0, 51.0, 62.0, 139.0, 328.0, 828.0, 2826.0, 15529.0, 343292.0, 656704.0, 23356.0, 3529.0, 970.0, 408.0, 169.0, 103.0, 50.0, 25.0, 23.0, 16.0, 10.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.3536376953125, -3.258056640625, -3.1624755859375, -3.06689453125, -2.9713134765625, -2.875732421875, -2.7801513671875, -2.6845703125, -2.5889892578125, -2.493408203125, -2.3978271484375, -2.30224609375, -2.2066650390625, -2.111083984375, -2.0155029296875, -1.919921875, -1.8243408203125, -1.728759765625, -1.6331787109375, -1.53759765625, -1.4420166015625, -1.346435546875, -1.2508544921875, -1.1552734375, -1.0596923828125, -0.964111328125, -0.8685302734375, -0.77294921875, -0.6773681640625, -0.581787109375, -0.4862060546875, -0.390625, -0.2950439453125, -0.199462890625, -0.1038818359375, -0.00830078125, 0.0872802734375, 0.182861328125, 0.2784423828125, 0.3740234375, 0.4696044921875, 0.565185546875, 0.6607666015625, 0.75634765625, 0.8519287109375, 0.947509765625, 1.0430908203125, 1.138671875, 1.2342529296875, 1.329833984375, 1.4254150390625, 1.52099609375, 1.6165771484375, 1.712158203125, 1.8077392578125, 1.9033203125, 1.9989013671875, 2.094482421875, 2.1900634765625, 2.28564453125, 2.3812255859375, 2.476806640625, 2.5723876953125, 2.66796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 11.0, 15.0, 27.0, 29.0, 54.0, 66.0, 86.0, 107.0, 119.0, 104.0, 92.0, 76.0, 41.0, 31.0, 37.0, 16.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00029087066650390625, -0.0002825148403644562, -0.0002741590142250061, -0.00026580318808555603, -0.00025744736194610596, -0.0002490915358066559, -0.0002407357096672058, -0.00023237988352775574, -0.00022402405738830566, -0.0002156682312488556, -0.00020731240510940552, -0.00019895657896995544, -0.00019060075283050537, -0.0001822449266910553, -0.00017388910055160522, -0.00016553327441215515, -0.00015717744827270508, -0.000148821622133255, -0.00014046579599380493, -0.00013210996985435486, -0.00012375414371490479, -0.00011539831757545471, -0.00010704249143600464, -9.868666529655457e-05, -9.033083915710449e-05, -8.197501301765442e-05, -7.361918687820435e-05, -6.526336073875427e-05, -5.69075345993042e-05, -4.8551708459854126e-05, -4.019588232040405e-05, -3.184005618095398e-05, -2.3484230041503906e-05, -1.5128403902053833e-05, -6.77257776260376e-06, 1.5832483768463135e-06, 9.939074516296387e-06, 1.829490065574646e-05, 2.6650726795196533e-05, 3.5006552934646606e-05, 4.336237907409668e-05, 5.171820521354675e-05, 6.0074031352996826e-05, 6.84298574924469e-05, 7.678568363189697e-05, 8.514150977134705e-05, 9.349733591079712e-05, 0.00010185316205024719, 0.00011020898818969727, 0.00011856481432914734, 0.0001269206404685974, 0.00013527646660804749, 0.00014363229274749756, 0.00015198811888694763, 0.0001603439450263977, 0.00016869977116584778, 0.00017705559730529785, 0.00018541142344474792, 0.000193767249584198, 0.00020212307572364807, 0.00021047890186309814, 0.00021883472800254822, 0.0002271905541419983, 0.00023554638028144836, 0.00024390220642089844]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 17.0, 22.0, 35.0, 58.0, 109.0, 215.0, 465.0, 1297.0, 5242.0, 48450.0, 876484.0, 105370.0, 7906.0, 1754.0, 585.0, 241.0, 122.0, 75.0, 38.0, 24.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.36859130859375, -4.2684326171875, -4.16827392578125, -4.068115234375, -3.96795654296875, -3.8677978515625, -3.76763916015625, -3.66748046875, -3.56732177734375, -3.4671630859375, -3.36700439453125, -3.266845703125, -3.16668701171875, -3.0665283203125, -2.96636962890625, -2.8662109375, -2.76605224609375, -2.6658935546875, -2.56573486328125, -2.465576171875, -2.36541748046875, -2.2652587890625, -2.16510009765625, -2.06494140625, -1.96478271484375, -1.8646240234375, -1.76446533203125, -1.664306640625, -1.56414794921875, -1.4639892578125, -1.36383056640625, -1.263671875, -1.16351318359375, -1.0633544921875, -0.96319580078125, -0.863037109375, -0.76287841796875, -0.6627197265625, -0.56256103515625, -0.46240234375, -0.36224365234375, -0.2620849609375, -0.16192626953125, -0.061767578125, 0.03839111328125, 0.1385498046875, 0.23870849609375, 0.3388671875, 0.43902587890625, 0.5391845703125, 0.63934326171875, 0.739501953125, 0.83966064453125, 0.9398193359375, 1.03997802734375, 1.14013671875, 1.24029541015625, 1.3404541015625, 1.44061279296875, 1.540771484375, 1.64093017578125, 1.7410888671875, 1.84124755859375, 1.94140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 9.0, 15.0, 23.0, 36.0, 83.0, 115.0, 163.0, 161.0, 128.0, 108.0, 67.0, 31.0, 28.0, 12.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.78515625, -3.686370849609375, -3.58758544921875, -3.488800048828125, -3.3900146484375, -3.291229248046875, -3.19244384765625, -3.093658447265625, -2.994873046875, -2.896087646484375, -2.79730224609375, -2.698516845703125, -2.5997314453125, -2.500946044921875, -2.40216064453125, -2.303375244140625, -2.20458984375, -2.105804443359375, -2.00701904296875, -1.908233642578125, -1.8094482421875, -1.710662841796875, -1.61187744140625, -1.513092041015625, -1.414306640625, -1.315521240234375, -1.21673583984375, -1.117950439453125, -1.0191650390625, -0.920379638671875, -0.82159423828125, -0.722808837890625, -0.6240234375, -0.525238037109375, -0.42645263671875, -0.327667236328125, -0.2288818359375, -0.130096435546875, -0.03131103515625, 0.067474365234375, 0.166259765625, 0.265045166015625, 0.36383056640625, 0.462615966796875, 0.5614013671875, 0.660186767578125, 0.75897216796875, 0.857757568359375, 0.95654296875, 1.055328369140625, 1.15411376953125, 1.252899169921875, 1.3516845703125, 1.450469970703125, 1.54925537109375, 1.648040771484375, 1.746826171875, 1.845611572265625, 1.94439697265625, 2.043182373046875, 2.1419677734375, 2.240753173828125, 2.33953857421875, 2.438323974609375, 2.537109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 24.0, 93.0, 269.0, 346.0, 185.0, 49.0, 16.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-113.35630798339844, -111.19064331054688, -109.02497100830078, -106.85930633544922, -104.69363403320312, -102.52796936035156, -100.36229705810547, -98.1966323852539, -96.03096008300781, -93.86529541015625, -91.69962310791016, -89.5339584350586, -87.3682861328125, -85.20262145996094, -83.03694915771484, -80.87128448486328, -78.70561981201172, -76.53995513916016, -74.37428283691406, -72.2086181640625, -70.0429458618164, -67.87728118896484, -65.71160888671875, -63.54594421386719, -61.38027572631836, -59.21460723876953, -57.0489387512207, -54.883270263671875, -52.71760559082031, -50.55193328857422, -48.386268615722656, -46.22060012817383, -44.054927825927734, -41.889259338378906, -39.72359085083008, -37.55792236328125, -35.39225769042969, -33.226585388183594, -31.06092071533203, -28.895252227783203, -26.729583740234375, -24.563915252685547, -22.39824676513672, -20.232580184936523, -18.066911697387695, -15.901243209838867, -13.735575675964355, -11.569908142089844, -9.404239654541016, -7.238571643829346, -5.072903633117676, -2.907235622406006, -0.7415676116943359, 1.4241008758544922, 3.589768409729004, 5.755435943603516, 7.921104431152344, 10.086772918701172, 12.252440452575684, 14.418107986450195, 16.583776473999023, 18.74944496154785, 20.915111541748047, 23.080780029296875, 25.246448516845703]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 11.0, 11.0, 19.0, 15.0, 22.0, 21.0, 29.0, 34.0, 42.0, 37.0, 37.0, 47.0, 39.0, 59.0, 63.0, 60.0, 53.0, 45.0, 55.0, 43.0, 29.0, 39.0, 31.0, 29.0, 18.0, 21.0, 9.0, 18.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-23.170543670654297, -22.52720069885254, -21.88385581970215, -21.24051284790039, -20.597169876098633, -19.953826904296875, -19.310482025146484, -18.667139053344727, -18.02379608154297, -17.38045310974121, -16.73710823059082, -16.093765258789062, -15.450422286987305, -14.80707836151123, -14.163734436035156, -13.520391464233398, -12.877047538757324, -12.23370361328125, -11.590360641479492, -10.947016716003418, -10.30367374420166, -9.660329818725586, -9.016986846923828, -8.373642921447754, -7.730299472808838, -7.086956024169922, -6.443612575531006, -5.80026912689209, -5.156925201416016, -4.513582229614258, -3.8702383041381836, -3.2268948554992676, -2.5835514068603516, -1.9402079582214355, -1.29686439037323, -0.6535208225250244, -0.010177373886108398, 0.6331660747528076, 1.2765097618103027, 1.9198532104492188, 2.5631966590881348, 3.206540107727051, 3.849883556365967, 4.493227005004883, 5.136570930480957, 5.779913902282715, 6.423257827758789, 7.066601276397705, 7.709944725036621, 8.353288650512695, 8.996631622314453, 9.639975547790527, 10.283318519592285, 10.92666244506836, 11.570005416870117, 12.213349342346191, 12.856693267822266, 13.50003719329834, 14.143380165100098, 14.786724090576172, 15.43006706237793, 16.073410034179688, 16.716754913330078, 17.360097885131836, 18.003440856933594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 24.0, 26.0, 32.0, 57.0, 77.0, 131.0, 229.0, 368.0, 616.0, 1228.0, 2837.0, 9861.0, 73895.0, 4056716.0, 37012.0, 6598.0, 2139.0, 985.0, 567.0, 281.0, 189.0, 123.0, 82.0, 63.0, 37.0, 25.0, 18.0, 19.0, 5.0, 8.0, 1.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.46124267578125, -3.3131103515625, -3.16497802734375, -3.016845703125, -2.86871337890625, -2.7205810546875, -2.57244873046875, -2.42431640625, -2.27618408203125, -2.1280517578125, -1.97991943359375, -1.831787109375, -1.68365478515625, -1.5355224609375, -1.38739013671875, -1.2392578125, -1.09112548828125, -0.9429931640625, -0.79486083984375, -0.646728515625, -0.49859619140625, -0.3504638671875, -0.20233154296875, -0.05419921875, 0.09393310546875, 0.2420654296875, 0.39019775390625, 0.538330078125, 0.68646240234375, 0.8345947265625, 0.98272705078125, 1.130859375, 1.27899169921875, 1.4271240234375, 1.57525634765625, 1.723388671875, 1.87152099609375, 2.0196533203125, 2.16778564453125, 2.31591796875, 2.46405029296875, 2.6121826171875, 2.76031494140625, 2.908447265625, 3.05657958984375, 3.2047119140625, 3.35284423828125, 3.5009765625, 3.64910888671875, 3.7972412109375, 3.94537353515625, 4.093505859375, 4.24163818359375, 4.3897705078125, 4.53790283203125, 4.68603515625, 4.83416748046875, 4.9822998046875, 5.13043212890625, 5.278564453125, 5.42669677734375, 5.5748291015625, 5.72296142578125, 5.87109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 9.0, 14.0, 16.0, 37.0, 44.0, 59.0, 76.0, 102.0, 99.0, 101.0, 89.0, 80.0, 76.0, 56.0, 39.0, 39.0, 16.0, 10.0, 10.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.791015625, -1.7340545654296875, -1.677093505859375, -1.6201324462890625, -1.56317138671875, -1.5062103271484375, -1.449249267578125, -1.3922882080078125, -1.3353271484375, -1.2783660888671875, -1.221405029296875, -1.1644439697265625, -1.10748291015625, -1.0505218505859375, -0.993560791015625, -0.9365997314453125, -0.879638671875, -0.8226776123046875, -0.765716552734375, -0.7087554931640625, -0.65179443359375, -0.5948333740234375, -0.537872314453125, -0.4809112548828125, -0.4239501953125, -0.3669891357421875, -0.310028076171875, -0.2530670166015625, -0.19610595703125, -0.1391448974609375, -0.082183837890625, -0.0252227783203125, 0.03173828125, 0.0886993408203125, 0.145660400390625, 0.2026214599609375, 0.25958251953125, 0.3165435791015625, 0.373504638671875, 0.4304656982421875, 0.4874267578125, 0.5443878173828125, 0.601348876953125, 0.6583099365234375, 0.71527099609375, 0.7722320556640625, 0.829193115234375, 0.8861541748046875, 0.943115234375, 1.0000762939453125, 1.057037353515625, 1.1139984130859375, 1.17095947265625, 1.2279205322265625, 1.284881591796875, 1.3418426513671875, 1.3988037109375, 1.4557647705078125, 1.512725830078125, 1.5696868896484375, 1.62664794921875, 1.6836090087890625, 1.740570068359375, 1.7975311279296875, 1.8544921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 16.0, 17.0, 26.0, 45.0, 47.0, 56.0, 109.0, 131.0, 201.0, 294.0, 381.0, 586.0, 992.0, 1854.0, 3736.0, 7788.0, 20004.0, 78790.0, 3807073.0, 214495.0, 34566.0, 11633.0, 5038.0, 2505.0, 1412.0, 792.0, 489.0, 337.0, 232.0, 161.0, 129.0, 92.0, 70.0, 45.0, 34.0, 29.0, 16.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.71875, -2.633056640625, -2.54736328125, -2.461669921875, -2.3759765625, -2.290283203125, -2.20458984375, -2.118896484375, -2.033203125, -1.947509765625, -1.86181640625, -1.776123046875, -1.6904296875, -1.604736328125, -1.51904296875, -1.433349609375, -1.34765625, -1.261962890625, -1.17626953125, -1.090576171875, -1.0048828125, -0.919189453125, -0.83349609375, -0.747802734375, -0.662109375, -0.576416015625, -0.49072265625, -0.405029296875, -0.3193359375, -0.233642578125, -0.14794921875, -0.062255859375, 0.0234375, 0.109130859375, 0.19482421875, 0.280517578125, 0.3662109375, 0.451904296875, 0.53759765625, 0.623291015625, 0.708984375, 0.794677734375, 0.88037109375, 0.966064453125, 1.0517578125, 1.137451171875, 1.22314453125, 1.308837890625, 1.39453125, 1.480224609375, 1.56591796875, 1.651611328125, 1.7373046875, 1.822998046875, 1.90869140625, 1.994384765625, 2.080078125, 2.165771484375, 2.25146484375, 2.337158203125, 2.4228515625, 2.508544921875, 2.59423828125, 2.679931640625, 2.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 11.0, 10.0, 8.0, 12.0, 19.0, 35.0, 56.0, 90.0, 213.0, 3031.0, 269.0, 101.0, 70.0, 41.0, 18.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97119140625, -0.9315872192382812, -0.8919830322265625, -0.8523788452148438, -0.812774658203125, -0.7731704711914062, -0.7335662841796875, -0.6939620971679688, -0.65435791015625, -0.6147537231445312, -0.5751495361328125, -0.5355453491210938, -0.495941162109375, -0.45633697509765625, -0.4167327880859375, -0.37712860107421875, -0.3375244140625, -0.29792022705078125, -0.2583160400390625, -0.21871185302734375, -0.179107666015625, -0.13950347900390625, -0.0998992919921875, -0.06029510498046875, -0.02069091796875, 0.01891326904296875, 0.0585174560546875, 0.09812164306640625, 0.137725830078125, 0.17733001708984375, 0.2169342041015625, 0.25653839111328125, 0.296142578125, 0.33574676513671875, 0.3753509521484375, 0.41495513916015625, 0.454559326171875, 0.49416351318359375, 0.5337677001953125, 0.5733718872070312, 0.61297607421875, 0.6525802612304688, 0.6921844482421875, 0.7317886352539062, 0.771392822265625, 0.8109970092773438, 0.8506011962890625, 0.8902053833007812, 0.9298095703125, 0.9694137573242188, 1.0090179443359375, 1.0486221313476562, 1.088226318359375, 1.1278305053710938, 1.1674346923828125, 1.2070388793945312, 1.24664306640625, 1.2862472534179688, 1.3258514404296875, 1.3654556274414062, 1.405059814453125, 1.4446640014648438, 1.4842681884765625, 1.5238723754882812, 1.5634765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 16.0, 31.0, 35.0, 66.0, 86.0, 102.0, 118.0, 105.0, 99.0, 83.0, 64.0, 42.0, 28.0, 25.0, 24.0, 16.0, 15.0, 13.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5456020832061768, -3.344350814819336, -3.143099784851074, -2.9418485164642334, -2.7405972480773926, -2.539346218109131, -2.33809494972229, -2.136843681335449, -1.9355926513671875, -1.7343415021896362, -1.533090353012085, -1.3318390846252441, -1.1305879354476929, -0.9293367862701416, -0.7280855178833008, -0.5268343687057495, -0.32558321952819824, -0.12433204054832458, 0.07691913843154907, 0.2781703472137451, 0.4794214963912964, 0.6806726455688477, 0.8819239139556885, 1.0831750631332397, 1.284426212310791, 1.4856773614883423, 1.6869285106658936, 1.8881797790527344, 2.089430809020996, 2.290682077407837, 2.4919333457946777, 2.6931843757629395, 2.8944358825683594, 3.0956871509552, 3.296938180923462, 3.4981894493103027, 3.6994404792785645, 3.9006917476654053, 4.101943016052246, 4.303194046020508, 4.5044450759887695, 4.705696105957031, 4.906947612762451, 5.108198642730713, 5.309449672698975, 5.5107011795043945, 5.711952209472656, 5.913203239440918, 6.114454746246338, 6.3157057762146, 6.5169572830200195, 6.718208312988281, 6.919459342956543, 7.120710372924805, 7.321961879730225, 7.523212909698486, 7.724464416503906, 7.925715446472168, 8.12696647644043, 8.328218460083008, 8.52946949005127, 8.730720520019531, 8.931971549987793, 9.133222579956055, 9.334473609924316]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 16.0, 5.0, 10.0, 14.0, 11.0, 13.0, 19.0, 14.0, 25.0, 21.0, 20.0, 34.0, 29.0, 22.0, 32.0, 27.0, 25.0, 32.0, 37.0, 34.0, 30.0, 34.0, 38.0, 44.0, 34.0, 30.0, 34.0, 23.0, 37.0, 32.0, 33.0, 22.0, 12.0, 28.0, 27.0, 16.0, 11.0, 13.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8851871490478516, -3.7598843574523926, -3.6345813274383545, -3.5092785358428955, -3.3839755058288574, -3.2586727142333984, -3.1333699226379395, -3.0080671310424805, -2.8827641010284424, -2.7574613094329834, -2.6321582794189453, -2.5068554878234863, -2.3815526962280273, -2.2562496662139893, -2.1309468746185303, -2.005643844604492, -1.8803410530090332, -1.7550381422042847, -1.6297352313995361, -1.5044324398040771, -1.3791295289993286, -1.25382661819458, -1.128523826599121, -1.0032209157943726, -0.877918004989624, -0.7526150941848755, -0.6273122429847717, -0.502009391784668, -0.37670648097991943, -0.2514035701751709, -0.12610071897506714, -0.0007978677749633789, 0.12450456619262695, 0.2498074471950531, 0.37511032819747925, 0.500413179397583, 0.6257160902023315, 0.7510190010070801, 0.8763218522071838, 1.0016247034072876, 1.1269276142120361, 1.2522305250167847, 1.3775334358215332, 1.5028362274169922, 1.6281391382217407, 1.7534420490264893, 1.8787448406219482, 2.0040478706359863, 2.1293506622314453, 2.2546534538269043, 2.3799564838409424, 2.5052592754364014, 2.6305623054504395, 2.7558650970458984, 2.8811678886413574, 3.0064706802368164, 3.1317737102508545, 3.2570765018463135, 3.3823795318603516, 3.5076823234558105, 3.6329851150512695, 3.7582881450653076, 3.8835909366607666, 4.008893966674805, 4.134196758270264]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 11.0, 9.0, 11.0, 21.0, 29.0, 44.0, 51.0, 100.0, 139.0, 256.0, 489.0, 953.0, 1776.0, 3909.0, 10122.0, 28554.0, 92678.0, 306794.0, 397029.0, 140079.0, 41239.0, 13941.0, 5521.0, 2235.0, 1109.0, 606.0, 324.0, 192.0, 116.0, 80.0, 35.0, 31.0, 18.0, 12.0, 15.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.1015625, -3.020294189453125, -2.93902587890625, -2.857757568359375, -2.7764892578125, -2.695220947265625, -2.61395263671875, -2.532684326171875, -2.451416015625, -2.370147705078125, -2.28887939453125, -2.207611083984375, -2.1263427734375, -2.045074462890625, -1.96380615234375, -1.882537841796875, -1.80126953125, -1.720001220703125, -1.63873291015625, -1.557464599609375, -1.4761962890625, -1.394927978515625, -1.31365966796875, -1.232391357421875, -1.151123046875, -1.069854736328125, -0.98858642578125, -0.907318115234375, -0.8260498046875, -0.744781494140625, -0.66351318359375, -0.582244873046875, -0.5009765625, -0.419708251953125, -0.33843994140625, -0.257171630859375, -0.1759033203125, -0.094635009765625, -0.01336669921875, 0.067901611328125, 0.149169921875, 0.230438232421875, 0.31170654296875, 0.392974853515625, 0.4742431640625, 0.555511474609375, 0.63677978515625, 0.718048095703125, 0.79931640625, 0.880584716796875, 0.96185302734375, 1.043121337890625, 1.1243896484375, 1.205657958984375, 1.28692626953125, 1.368194580078125, 1.449462890625, 1.530731201171875, 1.61199951171875, 1.693267822265625, 1.7745361328125, 1.855804443359375, 1.93707275390625, 2.018341064453125, 2.099609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 9.0, 5.0, 11.0, 13.0, 22.0, 35.0, 36.0, 42.0, 43.0, 73.0, 81.0, 74.0, 75.0, 83.0, 60.0, 57.0, 51.0, 47.0, 51.0, 30.0, 24.0, 14.0, 12.0, 14.0, 10.0, 9.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.5506591796875, -1.501708984375, -1.4527587890625, -1.40380859375, -1.3548583984375, -1.305908203125, -1.2569580078125, -1.2080078125, -1.1590576171875, -1.110107421875, -1.0611572265625, -1.01220703125, -0.9632568359375, -0.914306640625, -0.8653564453125, -0.81640625, -0.7674560546875, -0.718505859375, -0.6695556640625, -0.62060546875, -0.5716552734375, -0.522705078125, -0.4737548828125, -0.4248046875, -0.3758544921875, -0.326904296875, -0.2779541015625, -0.22900390625, -0.1800537109375, -0.131103515625, -0.0821533203125, -0.033203125, 0.0157470703125, 0.064697265625, 0.1136474609375, 0.16259765625, 0.2115478515625, 0.260498046875, 0.3094482421875, 0.3583984375, 0.4073486328125, 0.456298828125, 0.5052490234375, 0.55419921875, 0.6031494140625, 0.652099609375, 0.7010498046875, 0.75, 0.7989501953125, 0.847900390625, 0.8968505859375, 0.94580078125, 0.9947509765625, 1.043701171875, 1.0926513671875, 1.1416015625, 1.1905517578125, 1.239501953125, 1.2884521484375, 1.33740234375, 1.3863525390625, 1.435302734375, 1.4842529296875, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 6.0, 6.0, 7.0, 8.0, 8.0, 17.0, 35.0, 20.0, 43.0, 63.0, 90.0, 114.0, 225.0, 350.0, 576.0, 1168.0, 2511.0, 6446.0, 22367.0, 108384.0, 535327.0, 297693.0, 52321.0, 12619.0, 4208.0, 1756.0, 864.0, 506.0, 255.0, 167.0, 103.0, 82.0, 52.0, 33.0, 28.0, 34.0, 11.0, 12.0, 9.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.326171875, -3.22772216796875, -3.1292724609375, -3.03082275390625, -2.932373046875, -2.83392333984375, -2.7354736328125, -2.63702392578125, -2.53857421875, -2.44012451171875, -2.3416748046875, -2.24322509765625, -2.144775390625, -2.04632568359375, -1.9478759765625, -1.84942626953125, -1.7509765625, -1.65252685546875, -1.5540771484375, -1.45562744140625, -1.357177734375, -1.25872802734375, -1.1602783203125, -1.06182861328125, -0.96337890625, -0.86492919921875, -0.7664794921875, -0.66802978515625, -0.569580078125, -0.47113037109375, -0.3726806640625, -0.27423095703125, -0.17578125, -0.07733154296875, 0.0211181640625, 0.11956787109375, 0.218017578125, 0.31646728515625, 0.4149169921875, 0.51336669921875, 0.61181640625, 0.71026611328125, 0.8087158203125, 0.90716552734375, 1.005615234375, 1.10406494140625, 1.2025146484375, 1.30096435546875, 1.3994140625, 1.49786376953125, 1.5963134765625, 1.69476318359375, 1.793212890625, 1.89166259765625, 1.9901123046875, 2.08856201171875, 2.18701171875, 2.28546142578125, 2.3839111328125, 2.48236083984375, 2.580810546875, 2.67926025390625, 2.7777099609375, 2.87615966796875, 2.974609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 19.0, 23.0, 28.0, 39.0, 44.0, 51.0, 48.0, 56.0, 71.0, 77.0, 62.0, 48.0, 48.0, 66.0, 54.0, 47.0, 33.0, 28.0, 37.0, 27.0, 10.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29296875, -6.10784912109375, -5.9227294921875, -5.73760986328125, -5.552490234375, -5.36737060546875, -5.1822509765625, -4.99713134765625, -4.81201171875, -4.62689208984375, -4.4417724609375, -4.25665283203125, -4.071533203125, -3.88641357421875, -3.7012939453125, -3.51617431640625, -3.3310546875, -3.14593505859375, -2.9608154296875, -2.77569580078125, -2.590576171875, -2.40545654296875, -2.2203369140625, -2.03521728515625, -1.85009765625, -1.66497802734375, -1.4798583984375, -1.29473876953125, -1.109619140625, -0.92449951171875, -0.7393798828125, -0.55426025390625, -0.369140625, -0.18402099609375, 0.0010986328125, 0.18621826171875, 0.371337890625, 0.55645751953125, 0.7415771484375, 0.92669677734375, 1.11181640625, 1.29693603515625, 1.4820556640625, 1.66717529296875, 1.852294921875, 2.03741455078125, 2.2225341796875, 2.40765380859375, 2.5927734375, 2.77789306640625, 2.9630126953125, 3.14813232421875, 3.333251953125, 3.51837158203125, 3.7034912109375, 3.88861083984375, 4.07373046875, 4.25885009765625, 4.4439697265625, 4.62908935546875, 4.814208984375, 4.99932861328125, 5.1844482421875, 5.36956787109375, 5.5546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 10.0, 11.0, 17.0, 20.0, 58.0, 135.0, 316.0, 930.0, 4832.0, 97352.0, 902893.0, 37901.0, 2998.0, 642.0, 221.0, 100.0, 46.0, 27.0, 16.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.314453125, -3.238037109375, -3.16162109375, -3.085205078125, -3.0087890625, -2.932373046875, -2.85595703125, -2.779541015625, -2.703125, -2.626708984375, -2.55029296875, -2.473876953125, -2.3974609375, -2.321044921875, -2.24462890625, -2.168212890625, -2.091796875, -2.015380859375, -1.93896484375, -1.862548828125, -1.7861328125, -1.709716796875, -1.63330078125, -1.556884765625, -1.48046875, -1.404052734375, -1.32763671875, -1.251220703125, -1.1748046875, -1.098388671875, -1.02197265625, -0.945556640625, -0.869140625, -0.792724609375, -0.71630859375, -0.639892578125, -0.5634765625, -0.487060546875, -0.41064453125, -0.334228515625, -0.2578125, -0.181396484375, -0.10498046875, -0.028564453125, 0.0478515625, 0.124267578125, 0.20068359375, 0.277099609375, 0.353515625, 0.429931640625, 0.50634765625, 0.582763671875, 0.6591796875, 0.735595703125, 0.81201171875, 0.888427734375, 0.96484375, 1.041259765625, 1.11767578125, 1.194091796875, 1.2705078125, 1.346923828125, 1.42333984375, 1.499755859375, 1.576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 10.0, 15.0, 19.0, 21.0, 35.0, 47.0, 74.0, 85.0, 100.0, 109.0, 106.0, 75.0, 54.0, 73.0, 48.0, 29.0, 24.0, 19.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002689361572265625, -0.0002620033919811249, -0.00025507062673568726, -0.00024813786149024963, -0.000241205096244812, -0.0002342723309993744, -0.00022733956575393677, -0.00022040680050849915, -0.00021347403526306152, -0.0002065412700176239, -0.00019960850477218628, -0.00019267573952674866, -0.00018574297428131104, -0.0001788102090358734, -0.0001718774437904358, -0.00016494467854499817, -0.00015801191329956055, -0.00015107914805412292, -0.0001441463828086853, -0.00013721361756324768, -0.00013028085231781006, -0.00012334808707237244, -0.00011641532182693481, -0.00010948255658149719, -0.00010254979133605957, -9.561702609062195e-05, -8.868426084518433e-05, -8.17514955997467e-05, -7.481873035430908e-05, -6.788596510887146e-05, -6.095319986343384e-05, -5.4020434617996216e-05, -4.7087669372558594e-05, -4.015490412712097e-05, -3.322213888168335e-05, -2.6289373636245728e-05, -1.9356608390808105e-05, -1.2423843145370483e-05, -5.491077899932861e-06, 1.4416873455047607e-06, 8.374452590942383e-06, 1.5307217836380005e-05, 2.2239983081817627e-05, 2.917274832725525e-05, 3.610551357269287e-05, 4.303827881813049e-05, 4.9971044063568115e-05, 5.690380930900574e-05, 6.383657455444336e-05, 7.076933979988098e-05, 7.77021050453186e-05, 8.463487029075623e-05, 9.156763553619385e-05, 9.850040078163147e-05, 0.00010543316602706909, 0.00011236593127250671, 0.00011929869651794434, 0.00012623146176338196, 0.00013316422700881958, 0.0001400969922542572, 0.00014702975749969482, 0.00015396252274513245, 0.00016089528799057007, 0.0001678280532360077, 0.0001747608184814453]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 5.0, 11.0, 10.0, 10.0, 16.0, 24.0, 47.0, 51.0, 84.0, 172.0, 311.0, 540.0, 1126.0, 3000.0, 10576.0, 64159.0, 604797.0, 320168.0, 32473.0, 6865.0, 2186.0, 875.0, 426.0, 226.0, 125.0, 79.0, 42.0, 43.0, 21.0, 24.0, 16.0, 5.0, 8.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.2109375, -1.1689453125, -1.126953125, -1.0849609375, -1.04296875, -1.0009765625, -0.958984375, -0.9169921875, -0.875, -0.8330078125, -0.791015625, -0.7490234375, -0.70703125, -0.6650390625, -0.623046875, -0.5810546875, -0.5390625, -0.4970703125, -0.455078125, -0.4130859375, -0.37109375, -0.3291015625, -0.287109375, -0.2451171875, -0.203125, -0.1611328125, -0.119140625, -0.0771484375, -0.03515625, 0.0068359375, 0.048828125, 0.0908203125, 0.1328125, 0.1748046875, 0.216796875, 0.2587890625, 0.30078125, 0.3427734375, 0.384765625, 0.4267578125, 0.46875, 0.5107421875, 0.552734375, 0.5947265625, 0.63671875, 0.6787109375, 0.720703125, 0.7626953125, 0.8046875, 0.8466796875, 0.888671875, 0.9306640625, 0.97265625, 1.0146484375, 1.056640625, 1.0986328125, 1.140625, 1.1826171875, 1.224609375, 1.2666015625, 1.30859375, 1.3505859375, 1.392578125, 1.4345703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 11.0, 2.0, 10.0, 17.0, 18.0, 29.0, 35.0, 52.0, 61.0, 82.0, 90.0, 91.0, 84.0, 70.0, 75.0, 51.0, 46.0, 41.0, 29.0, 26.0, 16.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4423828125, -1.402130126953125, -1.36187744140625, -1.321624755859375, -1.2813720703125, -1.241119384765625, -1.20086669921875, -1.160614013671875, -1.120361328125, -1.080108642578125, -1.03985595703125, -0.999603271484375, -0.9593505859375, -0.919097900390625, -0.87884521484375, -0.838592529296875, -0.79833984375, -0.758087158203125, -0.71783447265625, -0.677581787109375, -0.6373291015625, -0.597076416015625, -0.55682373046875, -0.516571044921875, -0.476318359375, -0.436065673828125, -0.39581298828125, -0.355560302734375, -0.3153076171875, -0.275054931640625, -0.23480224609375, -0.194549560546875, -0.154296875, -0.114044189453125, -0.07379150390625, -0.033538818359375, 0.0067138671875, 0.046966552734375, 0.08721923828125, 0.127471923828125, 0.167724609375, 0.207977294921875, 0.24822998046875, 0.288482666015625, 0.3287353515625, 0.368988037109375, 0.40924072265625, 0.449493408203125, 0.48974609375, 0.529998779296875, 0.57025146484375, 0.610504150390625, 0.6507568359375, 0.691009521484375, 0.73126220703125, 0.771514892578125, 0.811767578125, 0.852020263671875, 0.89227294921875, 0.932525634765625, 0.9727783203125, 1.013031005859375, 1.05328369140625, 1.093536376953125, 1.1337890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 23.0, 44.0, 76.0, 154.0, 198.0, 169.0, 154.0, 83.0, 39.0, 29.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.013925552368164, -23.882144927978516, -22.750364303588867, -21.61858367919922, -20.48680305480957, -19.355022430419922, -18.223241806030273, -17.091461181640625, -15.959680557250977, -14.827899932861328, -13.69611930847168, -12.564338684082031, -11.432558059692383, -10.300777435302734, -9.168996810913086, -8.037216186523438, -6.905435562133789, -5.773654937744141, -4.641874313354492, -3.5100936889648438, -2.3783130645751953, -1.2465324401855469, -0.11475181579589844, 1.01702880859375, 2.1488094329833984, 3.280590057373047, 4.412370681762695, 5.544151306152344, 6.675931930541992, 7.807712554931641, 8.939493179321289, 10.071273803710938, 11.203056335449219, 12.334836959838867, 13.466617584228516, 14.598398208618164, 15.730178833007812, 16.86195945739746, 17.99374008178711, 19.125520706176758, 20.257301330566406, 21.389081954956055, 22.520862579345703, 23.65264320373535, 24.784423828125, 25.91620445251465, 27.047985076904297, 28.179765701293945, 29.311546325683594, 30.443326950073242, 31.57510757446289, 32.706886291503906, 33.83866882324219, 34.97045135498047, 36.102230072021484, 37.2340087890625, 38.36579132080078, 39.49757385253906, 40.62935256958008, 41.761131286621094, 42.892913818359375, 44.024696350097656, 45.15647506713867, 46.28825378417969, 47.42003631591797]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 9.0, 18.0, 15.0, 20.0, 21.0, 22.0, 35.0, 32.0, 44.0, 47.0, 47.0, 54.0, 68.0, 60.0, 55.0, 57.0, 60.0, 43.0, 47.0, 17.0, 46.0, 35.0, 23.0, 23.0, 24.0, 19.0, 11.0, 5.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.314420700073242, -25.57833480834961, -24.842247009277344, -24.10616111755371, -23.370073318481445, -22.633987426757812, -21.897899627685547, -21.161813735961914, -20.42572784423828, -19.68964195251465, -18.953554153442383, -18.21746826171875, -17.481380462646484, -16.74529457092285, -16.00920867919922, -15.273120880126953, -14.537034034729004, -13.800947189331055, -13.064860343933105, -12.328773498535156, -11.592687606811523, -10.856600761413574, -10.120513916015625, -9.384428024291992, -8.648340225219727, -7.912253379821777, -7.176167011260986, -6.440080165863037, -5.703993797302246, -4.967906951904297, -4.231820106506348, -3.4957337379455566, -2.7596473693847656, -2.0235607624053955, -1.2874740362167358, -0.5513873100280762, 0.18469929695129395, 0.9207859039306641, 1.6568727493286133, 2.3929591178894043, 3.1290459632873535, 3.8651325702667236, 4.601219177246094, 5.337306022644043, 6.073392868041992, 6.809479236602783, 7.545566082000732, 8.281652450561523, 9.017739295959473, 9.753826141357422, 10.489912986755371, 11.22599983215332, 11.962085723876953, 12.698172569274902, 13.434259414672852, 14.170345306396484, 14.90643310546875, 15.6425199508667, 16.37860679626465, 17.11469268798828, 17.850780487060547, 18.58686637878418, 19.322952270507812, 20.059040069580078, 20.79512596130371]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 18.0, 33.0, 51.0, 85.0, 145.0, 244.0, 465.0, 1029.0, 2223.0, 5363.0, 15076.0, 56912.0, 624502.0, 3312957.0, 133772.0, 26368.0, 8526.0, 3376.0, 1384.0, 758.0, 400.0, 202.0, 109.0, 92.0, 52.0, 36.0, 20.0, 15.0, 14.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.998077392578125, -1.92193603515625, -1.845794677734375, -1.7696533203125, -1.693511962890625, -1.61737060546875, -1.541229248046875, -1.465087890625, -1.388946533203125, -1.31280517578125, -1.236663818359375, -1.1605224609375, -1.084381103515625, -1.00823974609375, -0.932098388671875, -0.85595703125, -0.779815673828125, -0.70367431640625, -0.627532958984375, -0.5513916015625, -0.475250244140625, -0.39910888671875, -0.322967529296875, -0.246826171875, -0.170684814453125, -0.09454345703125, -0.018402099609375, 0.0577392578125, 0.133880615234375, 0.21002197265625, 0.286163330078125, 0.3623046875, 0.438446044921875, 0.51458740234375, 0.590728759765625, 0.6668701171875, 0.743011474609375, 0.81915283203125, 0.895294189453125, 0.971435546875, 1.047576904296875, 1.12371826171875, 1.199859619140625, 1.2760009765625, 1.352142333984375, 1.42828369140625, 1.504425048828125, 1.58056640625, 1.656707763671875, 1.73284912109375, 1.808990478515625, 1.8851318359375, 1.961273193359375, 2.03741455078125, 2.113555908203125, 2.189697265625, 2.265838623046875, 2.34197998046875, 2.418121337890625, 2.4942626953125, 2.570404052734375, 2.64654541015625, 2.722686767578125, 2.798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 8.0, 12.0, 25.0, 20.0, 31.0, 35.0, 32.0, 40.0, 46.0, 54.0, 53.0, 65.0, 62.0, 58.0, 56.0, 60.0, 42.0, 37.0, 39.0, 42.0, 38.0, 25.0, 23.0, 12.0, 16.0, 10.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9319381713867188, -0.8975677490234375, -0.8631973266601562, -0.828826904296875, -0.7944564819335938, -0.7600860595703125, -0.7257156372070312, -0.69134521484375, -0.6569747924804688, -0.6226043701171875, -0.5882339477539062, -0.553863525390625, -0.5194931030273438, -0.4851226806640625, -0.45075225830078125, -0.4163818359375, -0.38201141357421875, -0.3476409912109375, -0.31327056884765625, -0.278900146484375, -0.24452972412109375, -0.2101593017578125, -0.17578887939453125, -0.14141845703125, -0.10704803466796875, -0.0726776123046875, -0.03830718994140625, -0.003936767578125, 0.03043365478515625, 0.0648040771484375, 0.09917449951171875, 0.133544921875, 0.16791534423828125, 0.2022857666015625, 0.23665618896484375, 0.271026611328125, 0.30539703369140625, 0.3397674560546875, 0.37413787841796875, 0.40850830078125, 0.44287872314453125, 0.4772491455078125, 0.5116195678710938, 0.545989990234375, 0.5803604125976562, 0.6147308349609375, 0.6491012573242188, 0.6834716796875, 0.7178421020507812, 0.7522125244140625, 0.7865829467773438, 0.820953369140625, 0.8553237915039062, 0.8896942138671875, 0.9240646362304688, 0.95843505859375, 0.9928054809570312, 1.0271759033203125, 1.0615463256835938, 1.095916748046875, 1.1302871704101562, 1.1646575927734375, 1.1990280151367188, 1.2333984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 0.0, 6.0, 9.0, 5.0, 14.0, 25.0, 28.0, 81.0, 146.0, 350.0, 1000.0, 3940.0, 22370.0, 373989.0, 3718752.0, 62358.0, 8333.0, 1928.0, 534.0, 189.0, 88.0, 46.0, 24.0, 19.0, 12.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.35546875, -4.20648193359375, -4.0574951171875, -3.90850830078125, -3.759521484375, -3.61053466796875, -3.4615478515625, -3.31256103515625, -3.16357421875, -3.01458740234375, -2.8656005859375, -2.71661376953125, -2.567626953125, -2.41864013671875, -2.2696533203125, -2.12066650390625, -1.9716796875, -1.82269287109375, -1.6737060546875, -1.52471923828125, -1.375732421875, -1.22674560546875, -1.0777587890625, -0.92877197265625, -0.77978515625, -0.63079833984375, -0.4818115234375, -0.33282470703125, -0.183837890625, -0.03485107421875, 0.1141357421875, 0.26312255859375, 0.412109375, 0.56109619140625, 0.7100830078125, 0.85906982421875, 1.008056640625, 1.15704345703125, 1.3060302734375, 1.45501708984375, 1.60400390625, 1.75299072265625, 1.9019775390625, 2.05096435546875, 2.199951171875, 2.34893798828125, 2.4979248046875, 2.64691162109375, 2.7958984375, 2.94488525390625, 3.0938720703125, 3.24285888671875, 3.391845703125, 3.54083251953125, 3.6898193359375, 3.83880615234375, 3.98779296875, 4.13677978515625, 4.2857666015625, 4.43475341796875, 4.583740234375, 4.73272705078125, 4.8817138671875, 5.03070068359375, 5.1796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 8.0, 13.0, 19.0, 24.0, 36.0, 51.0, 102.0, 144.0, 304.0, 767.0, 1511.0, 583.0, 208.0, 95.0, 45.0, 41.0, 29.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2188720703125, -4.105712890625, -3.9925537109375, -3.87939453125, -3.7662353515625, -3.653076171875, -3.5399169921875, -3.4267578125, -3.3135986328125, -3.200439453125, -3.0872802734375, -2.97412109375, -2.8609619140625, -2.747802734375, -2.6346435546875, -2.521484375, -2.4083251953125, -2.295166015625, -2.1820068359375, -2.06884765625, -1.9556884765625, -1.842529296875, -1.7293701171875, -1.6162109375, -1.5030517578125, -1.389892578125, -1.2767333984375, -1.16357421875, -1.0504150390625, -0.937255859375, -0.8240966796875, -0.7109375, -0.5977783203125, -0.484619140625, -0.3714599609375, -0.25830078125, -0.1451416015625, -0.031982421875, 0.0811767578125, 0.1943359375, 0.3074951171875, 0.420654296875, 0.5338134765625, 0.64697265625, 0.7601318359375, 0.873291015625, 0.9864501953125, 1.099609375, 1.2127685546875, 1.325927734375, 1.4390869140625, 1.55224609375, 1.6654052734375, 1.778564453125, 1.8917236328125, 2.0048828125, 2.1180419921875, 2.231201171875, 2.3443603515625, 2.45751953125, 2.5706787109375, 2.683837890625, 2.7969970703125, 2.91015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 21.0, 33.0, 76.0, 133.0, 243.0, 219.0, 127.0, 78.0, 29.0, 12.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203954696655273, -27.14052963256836, -26.077106475830078, -25.013681411743164, -23.95025634765625, -22.88683319091797, -21.823408126831055, -20.75998306274414, -19.69655990600586, -18.633134841918945, -17.569711685180664, -16.50628662109375, -15.442862510681152, -14.379438400268555, -13.31601333618164, -12.252589225769043, -11.189165115356445, -10.125741004943848, -9.06231689453125, -7.998891830444336, -6.935467720031738, -5.872043609619141, -4.808619022369385, -3.745194435119629, -2.6817703247070312, -1.6183459758758545, -0.5549216270446777, 0.508502721786499, 1.5719270706176758, 2.6353511810302734, 3.6987757682800293, 4.762200355529785, 5.82562255859375, 6.889046669006348, 7.9524712562561035, 9.01589584350586, 10.079319953918457, 11.142744064331055, 12.206169128417969, 13.269593238830566, 14.333017349243164, 15.396441459655762, 16.45986557006836, 17.523290634155273, 18.586715698242188, 19.65013885498047, 20.713563919067383, 21.776988983154297, 22.840412139892578, 23.903837203979492, 24.967260360717773, 26.030685424804688, 27.09410858154297, 28.157533645629883, 29.220958709716797, 30.284381866455078, 31.347806930541992, 32.411231994628906, 33.47465515136719, 34.53807830810547, 35.601505279541016, 36.6649284362793, 37.72835159301758, 38.791778564453125, 39.855201721191406]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 17.0, 16.0, 23.0, 29.0, 31.0, 41.0, 27.0, 47.0, 54.0, 58.0, 65.0, 83.0, 64.0, 66.0, 62.0, 55.0, 44.0, 41.0, 33.0, 30.0, 23.0, 19.0, 16.0, 9.0, 3.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64159393310547, -16.08203887939453, -15.522483825683594, -14.962928771972656, -14.403374671936035, -13.843819618225098, -13.28426456451416, -12.724709510803223, -12.165155410766602, -11.605600357055664, -11.046045303344727, -10.486490249633789, -9.926936149597168, -9.36738109588623, -8.807826042175293, -8.248270988464355, -7.688715934753418, -7.1291608810424805, -6.569606304168701, -6.010051250457764, -5.450496673583984, -4.890941619873047, -4.331386566162109, -3.771831750869751, -3.2122769355773926, -2.652722120285034, -2.093167304992676, -1.5336122512817383, -0.9740574359893799, -0.4145026206970215, 0.14505243301391602, 0.7046072483062744, 1.2641620635986328, 1.8237168788909912, 2.3832716941833496, 2.942826747894287, 3.5023815631866455, 4.061936378479004, 4.621491432189941, 5.181046485900879, 5.740601062774658, 6.300156116485596, 6.859710693359375, 7.4192657470703125, 7.97882080078125, 8.538375854492188, 9.097930908203125, 9.657485008239746, 10.217040061950684, 10.776595115661621, 11.336150169372559, 11.89570426940918, 12.455259323120117, 13.014814376831055, 13.574369430541992, 14.13392448425293, 14.693479537963867, 15.253034591674805, 15.812589645385742, 16.37214469909668, 16.931699752807617, 17.491252899169922, 18.05080795288086, 18.610363006591797, 19.169918060302734]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 8.0, 7.0, 9.0, 21.0, 23.0, 35.0, 56.0, 91.0, 127.0, 186.0, 300.0, 517.0, 863.0, 1439.0, 2460.0, 4559.0, 8779.0, 17123.0, 36152.0, 76015.0, 157046.0, 264373.0, 235266.0, 125374.0, 59923.0, 28160.0, 13727.0, 7011.0, 3756.0, 2095.0, 1177.0, 692.0, 394.0, 264.0, 166.0, 123.0, 83.0, 54.0, 38.0, 30.0, 19.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3171844482421875, -1.273040771484375, -1.2288970947265625, -1.18475341796875, -1.1406097412109375, -1.096466064453125, -1.0523223876953125, -1.0081787109375, -0.9640350341796875, -0.919891357421875, -0.8757476806640625, -0.83160400390625, -0.7874603271484375, -0.743316650390625, -0.6991729736328125, -0.655029296875, -0.6108856201171875, -0.566741943359375, -0.5225982666015625, -0.47845458984375, -0.4343109130859375, -0.390167236328125, -0.3460235595703125, -0.3018798828125, -0.2577362060546875, -0.213592529296875, -0.1694488525390625, -0.12530517578125, -0.0811614990234375, -0.037017822265625, 0.0071258544921875, 0.05126953125, 0.0954132080078125, 0.139556884765625, 0.1837005615234375, 0.22784423828125, 0.2719879150390625, 0.316131591796875, 0.3602752685546875, 0.4044189453125, 0.4485626220703125, 0.492706298828125, 0.5368499755859375, 0.58099365234375, 0.6251373291015625, 0.669281005859375, 0.7134246826171875, 0.757568359375, 0.8017120361328125, 0.845855712890625, 0.8899993896484375, 0.93414306640625, 0.9782867431640625, 1.022430419921875, 1.0665740966796875, 1.1107177734375, 1.1548614501953125, 1.199005126953125, 1.2431488037109375, 1.28729248046875, 1.3314361572265625, 1.375579833984375, 1.4197235107421875, 1.4638671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 0.0, 4.0, 6.0, 13.0, 16.0, 19.0, 25.0, 29.0, 32.0, 33.0, 53.0, 33.0, 46.0, 63.0, 47.0, 44.0, 54.0, 49.0, 56.0, 48.0, 62.0, 36.0, 40.0, 32.0, 24.0, 20.0, 31.0, 18.0, 16.0, 10.0, 8.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0244140625, -0.9920806884765625, -0.959747314453125, -0.9274139404296875, -0.89508056640625, -0.8627471923828125, -0.830413818359375, -0.7980804443359375, -0.7657470703125, -0.7334136962890625, -0.701080322265625, -0.6687469482421875, -0.63641357421875, -0.6040802001953125, -0.571746826171875, -0.5394134521484375, -0.507080078125, -0.4747467041015625, -0.442413330078125, -0.4100799560546875, -0.37774658203125, -0.3454132080078125, -0.313079833984375, -0.2807464599609375, -0.2484130859375, -0.2160797119140625, -0.183746337890625, -0.1514129638671875, -0.11907958984375, -0.0867462158203125, -0.054412841796875, -0.0220794677734375, 0.01025390625, 0.0425872802734375, 0.074920654296875, 0.1072540283203125, 0.13958740234375, 0.1719207763671875, 0.204254150390625, 0.2365875244140625, 0.2689208984375, 0.3012542724609375, 0.333587646484375, 0.3659210205078125, 0.39825439453125, 0.4305877685546875, 0.462921142578125, 0.4952545166015625, 0.527587890625, 0.5599212646484375, 0.592254638671875, 0.6245880126953125, 0.65692138671875, 0.6892547607421875, 0.721588134765625, 0.7539215087890625, 0.7862548828125, 0.8185882568359375, 0.850921630859375, 0.8832550048828125, 0.91558837890625, 0.9479217529296875, 0.980255126953125, 1.0125885009765625, 1.044921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 9.0, 9.0, 20.0, 28.0, 40.0, 63.0, 110.0, 146.0, 213.0, 335.0, 553.0, 872.0, 1865.0, 4383.0, 14832.0, 77468.0, 561147.0, 323038.0, 46319.0, 10096.0, 3351.0, 1501.0, 829.0, 495.0, 262.0, 193.0, 117.0, 93.0, 42.0, 34.0, 24.0, 21.0, 12.0, 9.0, 10.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8101806640625, -2.716064453125, -2.6219482421875, -2.52783203125, -2.4337158203125, -2.339599609375, -2.2454833984375, -2.1513671875, -2.0572509765625, -1.963134765625, -1.8690185546875, -1.77490234375, -1.6807861328125, -1.586669921875, -1.4925537109375, -1.3984375, -1.3043212890625, -1.210205078125, -1.1160888671875, -1.02197265625, -0.9278564453125, -0.833740234375, -0.7396240234375, -0.6455078125, -0.5513916015625, -0.457275390625, -0.3631591796875, -0.26904296875, -0.1749267578125, -0.080810546875, 0.0133056640625, 0.107421875, 0.2015380859375, 0.295654296875, 0.3897705078125, 0.48388671875, 0.5780029296875, 0.672119140625, 0.7662353515625, 0.8603515625, 0.9544677734375, 1.048583984375, 1.1427001953125, 1.23681640625, 1.3309326171875, 1.425048828125, 1.5191650390625, 1.61328125, 1.7073974609375, 1.801513671875, 1.8956298828125, 1.98974609375, 2.0838623046875, 2.177978515625, 2.2720947265625, 2.3662109375, 2.4603271484375, 2.554443359375, 2.6485595703125, 2.74267578125, 2.8367919921875, 2.930908203125, 3.0250244140625, 3.119140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 7.0, 11.0, 9.0, 16.0, 14.0, 14.0, 18.0, 22.0, 28.0, 36.0, 37.0, 25.0, 46.0, 40.0, 36.0, 46.0, 53.0, 37.0, 45.0, 52.0, 37.0, 37.0, 44.0, 33.0, 42.0, 37.0, 27.0, 15.0, 25.0, 18.0, 16.0, 12.0, 3.0, 5.0, 8.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.626953125, -3.511871337890625, -3.39678955078125, -3.281707763671875, -3.1666259765625, -3.051544189453125, -2.93646240234375, -2.821380615234375, -2.706298828125, -2.591217041015625, -2.47613525390625, -2.361053466796875, -2.2459716796875, -2.130889892578125, -2.01580810546875, -1.900726318359375, -1.78564453125, -1.670562744140625, -1.55548095703125, -1.440399169921875, -1.3253173828125, -1.210235595703125, -1.09515380859375, -0.980072021484375, -0.864990234375, -0.749908447265625, -0.63482666015625, -0.519744873046875, -0.4046630859375, -0.289581298828125, -0.17449951171875, -0.059417724609375, 0.0556640625, 0.170745849609375, 0.28582763671875, 0.400909423828125, 0.5159912109375, 0.631072998046875, 0.74615478515625, 0.861236572265625, 0.976318359375, 1.091400146484375, 1.20648193359375, 1.321563720703125, 1.4366455078125, 1.551727294921875, 1.66680908203125, 1.781890869140625, 1.89697265625, 2.012054443359375, 2.12713623046875, 2.242218017578125, 2.3572998046875, 2.472381591796875, 2.58746337890625, 2.702545166015625, 2.817626953125, 2.932708740234375, 3.04779052734375, 3.162872314453125, 3.2779541015625, 3.393035888671875, 3.50811767578125, 3.623199462890625, 3.73828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 1.0, 8.0, 16.0, 25.0, 41.0, 67.0, 114.0, 229.0, 451.0, 1068.0, 3575.0, 22706.0, 591134.0, 405261.0, 18668.0, 3258.0, 1078.0, 425.0, 181.0, 97.0, 46.0, 33.0, 24.0, 12.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.42718505859375, -1.3699951171875, -1.31280517578125, -1.255615234375, -1.19842529296875, -1.1412353515625, -1.08404541015625, -1.02685546875, -0.96966552734375, -0.9124755859375, -0.85528564453125, -0.798095703125, -0.74090576171875, -0.6837158203125, -0.62652587890625, -0.5693359375, -0.51214599609375, -0.4549560546875, -0.39776611328125, -0.340576171875, -0.28338623046875, -0.2261962890625, -0.16900634765625, -0.11181640625, -0.05462646484375, 0.0025634765625, 0.05975341796875, 0.116943359375, 0.17413330078125, 0.2313232421875, 0.28851318359375, 0.345703125, 0.40289306640625, 0.4600830078125, 0.51727294921875, 0.574462890625, 0.63165283203125, 0.6888427734375, 0.74603271484375, 0.80322265625, 0.86041259765625, 0.9176025390625, 0.97479248046875, 1.031982421875, 1.08917236328125, 1.1463623046875, 1.20355224609375, 1.2607421875, 1.31793212890625, 1.3751220703125, 1.43231201171875, 1.489501953125, 1.54669189453125, 1.6038818359375, 1.66107177734375, 1.71826171875, 1.77545166015625, 1.8326416015625, 1.88983154296875, 1.947021484375, 2.00421142578125, 2.0614013671875, 2.11859130859375, 2.17578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 11.0, 18.0, 16.0, 30.0, 32.0, 30.0, 40.0, 63.0, 74.0, 94.0, 101.0, 93.0, 81.0, 73.0, 70.0, 31.0, 37.0, 22.0, 18.0, 13.0, 11.0, 1.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00025326013565063477, -0.00024688243865966797, -0.00024050474166870117, -0.00023412704467773438, -0.00022774934768676758, -0.00022137165069580078, -0.00021499395370483398, -0.0002086162567138672, -0.0002022385597229004, -0.0001958608627319336, -0.0001894831657409668, -0.00018310546875, -0.0001767277717590332, -0.0001703500747680664, -0.0001639723777770996, -0.0001575946807861328, -0.00015121698379516602, -0.00014483928680419922, -0.00013846158981323242, -0.00013208389282226562, -0.00012570619583129883, -0.00011932849884033203, -0.00011295080184936523, -0.00010657310485839844, -0.00010019540786743164, -9.381771087646484e-05, -8.744001388549805e-05, -8.106231689453125e-05, -7.468461990356445e-05, -6.830692291259766e-05, -6.192922592163086e-05, -5.555152893066406e-05, -4.9173831939697266e-05, -4.279613494873047e-05, -3.641843795776367e-05, -3.0040740966796875e-05, -2.3663043975830078e-05, -1.728534698486328e-05, -1.0907649993896484e-05, -4.5299530029296875e-06, 1.8477439880371094e-06, 8.225440979003906e-06, 1.4603137969970703e-05, 2.09808349609375e-05, 2.7358531951904297e-05, 3.3736228942871094e-05, 4.011392593383789e-05, 4.649162292480469e-05, 5.2869319915771484e-05, 5.924701690673828e-05, 6.562471389770508e-05, 7.200241088867188e-05, 7.838010787963867e-05, 8.475780487060547e-05, 9.113550186157227e-05, 9.751319885253906e-05, 0.00010389089584350586, 0.00011026859283447266, 0.00011664628982543945, 0.00012302398681640625, 0.00012940168380737305, 0.00013577938079833984, 0.00014215707778930664, 0.00014853477478027344]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 20.0, 22.0, 31.0, 43.0, 76.0, 148.0, 277.0, 554.0, 1278.0, 3431.0, 13945.0, 123505.0, 764892.0, 120715.0, 13728.0, 3409.0, 1228.0, 540.0, 271.0, 161.0, 97.0, 60.0, 37.0, 27.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8165740966796875, -1.772796630859375, -1.7290191650390625, -1.68524169921875, -1.6414642333984375, -1.597686767578125, -1.5539093017578125, -1.5101318359375, -1.4663543701171875, -1.422576904296875, -1.3787994384765625, -1.33502197265625, -1.2912445068359375, -1.247467041015625, -1.2036895751953125, -1.159912109375, -1.1161346435546875, -1.072357177734375, -1.0285797119140625, -0.98480224609375, -0.9410247802734375, -0.897247314453125, -0.8534698486328125, -0.8096923828125, -0.7659149169921875, -0.722137451171875, -0.6783599853515625, -0.63458251953125, -0.5908050537109375, -0.547027587890625, -0.5032501220703125, -0.45947265625, -0.4156951904296875, -0.371917724609375, -0.3281402587890625, -0.28436279296875, -0.2405853271484375, -0.196807861328125, -0.1530303955078125, -0.1092529296875, -0.0654754638671875, -0.021697998046875, 0.0220794677734375, 0.06585693359375, 0.1096343994140625, 0.153411865234375, 0.1971893310546875, 0.240966796875, 0.2847442626953125, 0.328521728515625, 0.3722991943359375, 0.41607666015625, 0.4598541259765625, 0.503631591796875, 0.5474090576171875, 0.5911865234375, 0.6349639892578125, 0.678741455078125, 0.7225189208984375, 0.76629638671875, 0.8100738525390625, 0.853851318359375, 0.8976287841796875, 0.94140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 21.0, 24.0, 36.0, 42.0, 74.0, 78.0, 62.0, 92.0, 116.0, 96.0, 90.0, 69.0, 44.0, 41.0, 29.0, 29.0, 14.0, 4.0, 11.0, 6.0, 0.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.103515625, -2.0527496337890625, -2.001983642578125, -1.9512176513671875, -1.90045166015625, -1.8496856689453125, -1.798919677734375, -1.7481536865234375, -1.6973876953125, -1.6466217041015625, -1.595855712890625, -1.5450897216796875, -1.49432373046875, -1.4435577392578125, -1.392791748046875, -1.3420257568359375, -1.291259765625, -1.2404937744140625, -1.189727783203125, -1.1389617919921875, -1.08819580078125, -1.0374298095703125, -0.986663818359375, -0.9358978271484375, -0.8851318359375, -0.8343658447265625, -0.783599853515625, -0.7328338623046875, -0.68206787109375, -0.6313018798828125, -0.580535888671875, -0.5297698974609375, -0.47900390625, -0.4282379150390625, -0.377471923828125, -0.3267059326171875, -0.27593994140625, -0.2251739501953125, -0.174407958984375, -0.1236419677734375, -0.0728759765625, -0.0221099853515625, 0.028656005859375, 0.0794219970703125, 0.13018798828125, 0.1809539794921875, 0.231719970703125, 0.2824859619140625, 0.333251953125, 0.3840179443359375, 0.434783935546875, 0.4855499267578125, 0.53631591796875, 0.5870819091796875, 0.637847900390625, 0.6886138916015625, 0.7393798828125, 0.7901458740234375, 0.840911865234375, 0.8916778564453125, 0.94244384765625, 0.9932098388671875, 1.043975830078125, 1.0947418212890625, 1.1455078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 21.0, 107.0, 242.0, 357.0, 193.0, 48.0, 11.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57146453857422, -38.9788818359375, -37.38629913330078, -35.79371643066406, -34.201133728027344, -32.608551025390625, -31.01597023010254, -29.42338752746582, -27.8308048248291, -26.238222122192383, -24.645639419555664, -23.053058624267578, -21.46047592163086, -19.86789321899414, -18.275310516357422, -16.682727813720703, -15.090145111083984, -13.497562408447266, -11.904979705810547, -10.312397956848145, -8.719815254211426, -7.127232551574707, -5.534650802612305, -3.942068099975586, -2.349485397338867, -0.7569029331207275, 0.8356795310974121, 2.4282617568969727, 4.020844459533691, 5.61342716217041, 7.2060089111328125, 8.798591613769531, 10.391170501708984, 11.983753204345703, 13.576335906982422, 15.168917655944824, 16.76150131225586, 18.354084014892578, 19.946664810180664, 21.539247512817383, 23.1318302154541, 24.72441291809082, 26.31699562072754, 27.909576416015625, 29.502159118652344, 31.094741821289062, 32.68732452392578, 34.2799072265625, 35.87248992919922, 37.46507263183594, 39.057655334472656, 40.650238037109375, 42.242820739746094, 43.83540344238281, 45.42798614501953, 47.02056884765625, 48.61315155029297, 50.20573425292969, 51.798316955566406, 53.390899658203125, 54.983482360839844, 56.57606506347656, 58.16864776611328, 59.76123046875, 61.35380935668945]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 16.0, 13.0, 23.0, 35.0, 30.0, 30.0, 49.0, 74.0, 73.0, 71.0, 81.0, 77.0, 58.0, 63.0, 51.0, 44.0, 50.0, 30.0, 23.0, 16.0, 10.0, 12.0, 19.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.497474670410156, -23.804574966430664, -23.11167335510254, -22.418773651123047, -21.725872039794922, -21.03297233581543, -20.340072631835938, -19.647171020507812, -18.95427131652832, -18.261371612548828, -17.568470001220703, -16.87557029724121, -16.18267059326172, -15.489768981933594, -14.796869277954102, -14.103968620300293, -13.411067962646484, -12.718167304992676, -12.025266647338867, -11.332366943359375, -10.639466285705566, -9.946565628051758, -9.253665924072266, -8.560765266418457, -7.867864608764648, -7.17496395111084, -6.4820637702941895, -5.789163589477539, -5.0962629318237305, -4.403362274169922, -3.7104620933532715, -3.017561912536621, -2.3246631622314453, -1.6317627429962158, -0.9388623237609863, -0.24596190452575684, 0.44693851470947266, 1.1398389339447021, 1.8327393531799316, 2.525639533996582, 3.2185401916503906, 3.91144061088562, 4.60434103012085, 5.2972412109375, 5.990141868591309, 6.683042526245117, 7.375942707061768, 8.068842887878418, 8.761743545532227, 9.454644203186035, 10.147544860839844, 10.840444564819336, 11.533345222473145, 12.226245880126953, 12.919145584106445, 13.612046241760254, 14.304946899414062, 14.997847557067871, 15.69074821472168, 16.383647918701172, 17.076549530029297, 17.76944923400879, 18.46234893798828, 19.155250549316406, 19.8481502532959]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 9.0, 13.0, 13.0, 12.0, 15.0, 30.0, 24.0, 45.0, 77.0, 116.0, 222.0, 619.0, 4986.0, 170221.0, 3997475.0, 18003.0, 1497.0, 383.0, 170.0, 99.0, 71.0, 46.0, 32.0, 24.0, 19.0, 12.0, 14.0, 7.0, 8.0, 4.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.86016845703125, -5.6890869140625, -5.51800537109375, -5.346923828125, -5.17584228515625, -5.0047607421875, -4.83367919921875, -4.66259765625, -4.49151611328125, -4.3204345703125, -4.14935302734375, -3.978271484375, -3.80718994140625, -3.6361083984375, -3.46502685546875, -3.2939453125, -3.12286376953125, -2.9517822265625, -2.78070068359375, -2.609619140625, -2.43853759765625, -2.2674560546875, -2.09637451171875, -1.92529296875, -1.75421142578125, -1.5831298828125, -1.41204833984375, -1.240966796875, -1.06988525390625, -0.8988037109375, -0.72772216796875, -0.556640625, -0.38555908203125, -0.2144775390625, -0.04339599609375, 0.127685546875, 0.29876708984375, 0.4698486328125, 0.64093017578125, 0.81201171875, 0.98309326171875, 1.1541748046875, 1.32525634765625, 1.496337890625, 1.66741943359375, 1.8385009765625, 2.00958251953125, 2.1806640625, 2.35174560546875, 2.5228271484375, 2.69390869140625, 2.864990234375, 3.03607177734375, 3.2071533203125, 3.37823486328125, 3.54931640625, 3.72039794921875, 3.8914794921875, 4.06256103515625, 4.233642578125, 4.40472412109375, 4.5758056640625, 4.74688720703125, 4.91796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 22.0, 42.0, 69.0, 99.0, 137.0, 125.0, 147.0, 116.0, 95.0, 55.0, 46.0, 20.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.280487060546875, -2.19573974609375, -2.110992431640625, -2.0262451171875, -1.941497802734375, -1.85675048828125, -1.772003173828125, -1.687255859375, -1.602508544921875, -1.51776123046875, -1.433013916015625, -1.3482666015625, -1.263519287109375, -1.17877197265625, -1.094024658203125, -1.00927734375, -0.924530029296875, -0.83978271484375, -0.755035400390625, -0.6702880859375, -0.585540771484375, -0.50079345703125, -0.416046142578125, -0.331298828125, -0.246551513671875, -0.16180419921875, -0.077056884765625, 0.0076904296875, 0.092437744140625, 0.17718505859375, 0.261932373046875, 0.3466796875, 0.431427001953125, 0.51617431640625, 0.600921630859375, 0.6856689453125, 0.770416259765625, 0.85516357421875, 0.939910888671875, 1.024658203125, 1.109405517578125, 1.19415283203125, 1.278900146484375, 1.3636474609375, 1.448394775390625, 1.53314208984375, 1.617889404296875, 1.70263671875, 1.787384033203125, 1.87213134765625, 1.956878662109375, 2.0416259765625, 2.126373291015625, 2.21112060546875, 2.295867919921875, 2.380615234375, 2.465362548828125, 2.55010986328125, 2.634857177734375, 2.7196044921875, 2.804351806640625, 2.88909912109375, 2.973846435546875, 3.05859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 2.0, 8.0, 3.0, 14.0, 10.0, 25.0, 36.0, 76.0, 155.0, 291.0, 691.0, 1528.0, 3573.0, 9308.0, 25867.0, 103746.0, 1586633.0, 2290769.0, 123967.0, 29106.0, 10393.0, 4275.0, 1946.0, 860.0, 427.0, 246.0, 122.0, 70.0, 35.0, 32.0, 22.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.468719482421875, -1.41009521484375, -1.351470947265625, -1.2928466796875, -1.234222412109375, -1.17559814453125, -1.116973876953125, -1.058349609375, -0.999725341796875, -0.94110107421875, -0.882476806640625, -0.8238525390625, -0.765228271484375, -0.70660400390625, -0.647979736328125, -0.58935546875, -0.530731201171875, -0.47210693359375, -0.413482666015625, -0.3548583984375, -0.296234130859375, -0.23760986328125, -0.178985595703125, -0.120361328125, -0.061737060546875, -0.00311279296875, 0.055511474609375, 0.1141357421875, 0.172760009765625, 0.23138427734375, 0.290008544921875, 0.3486328125, 0.407257080078125, 0.46588134765625, 0.524505615234375, 0.5831298828125, 0.641754150390625, 0.70037841796875, 0.759002685546875, 0.817626953125, 0.876251220703125, 0.93487548828125, 0.993499755859375, 1.0521240234375, 1.110748291015625, 1.16937255859375, 1.227996826171875, 1.28662109375, 1.345245361328125, 1.40386962890625, 1.462493896484375, 1.5211181640625, 1.579742431640625, 1.63836669921875, 1.696990966796875, 1.755615234375, 1.814239501953125, 1.87286376953125, 1.931488037109375, 1.9901123046875, 2.048736572265625, 2.10736083984375, 2.165985107421875, 2.224609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 7.0, 6.0, 17.0, 16.0, 32.0, 30.0, 56.0, 80.0, 121.0, 237.0, 401.0, 725.0, 868.0, 592.0, 308.0, 182.0, 104.0, 73.0, 43.0, 35.0, 21.0, 19.0, 9.0, 11.0, 5.0, 9.0, 4.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.318084716796875, -1.25921630859375, -1.200347900390625, -1.1414794921875, -1.082611083984375, -1.02374267578125, -0.964874267578125, -0.906005859375, -0.847137451171875, -0.78826904296875, -0.729400634765625, -0.6705322265625, -0.611663818359375, -0.55279541015625, -0.493927001953125, -0.43505859375, -0.376190185546875, -0.31732177734375, -0.258453369140625, -0.1995849609375, -0.140716552734375, -0.08184814453125, -0.022979736328125, 0.035888671875, 0.094757080078125, 0.15362548828125, 0.212493896484375, 0.2713623046875, 0.330230712890625, 0.38909912109375, 0.447967529296875, 0.5068359375, 0.565704345703125, 0.62457275390625, 0.683441162109375, 0.7423095703125, 0.801177978515625, 0.86004638671875, 0.918914794921875, 0.977783203125, 1.036651611328125, 1.09552001953125, 1.154388427734375, 1.2132568359375, 1.272125244140625, 1.33099365234375, 1.389862060546875, 1.44873046875, 1.507598876953125, 1.56646728515625, 1.625335693359375, 1.6842041015625, 1.743072509765625, 1.80194091796875, 1.860809326171875, 1.919677734375, 1.978546142578125, 2.03741455078125, 2.096282958984375, 2.1551513671875, 2.214019775390625, 2.27288818359375, 2.331756591796875, 2.390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 17.0, 55.0, 126.0, 255.0, 266.0, 154.0, 63.0, 29.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.99540328979492, -39.19813537597656, -38.40087127685547, -37.60360336303711, -36.80633544921875, -36.00906753540039, -35.2118034362793, -34.41453552246094, -33.61726760864258, -32.81999969482422, -32.022735595703125, -31.225467681884766, -30.428199768066406, -29.63093376159668, -28.833667755126953, -28.036399841308594, -27.239133834838867, -26.44186782836914, -25.64459991455078, -24.847333908081055, -24.050065994262695, -23.25279998779297, -22.45553207397461, -21.658266067504883, -20.861000061035156, -20.06373405456543, -19.26646614074707, -18.469200134277344, -17.671932220458984, -16.874666213989258, -16.07740020751953, -15.280132293701172, -14.482866287231445, -13.685599327087402, -12.88833236694336, -12.091066360473633, -11.293798446655273, -10.496532440185547, -9.699265480041504, -8.901998519897461, -8.104731559753418, -7.307464599609375, -6.510197639465332, -5.712931156158447, -4.915664196014404, -4.118397235870361, -3.3211307525634766, -2.5238637924194336, -1.7265968322753906, -0.9293299913406372, -0.1320631504058838, 0.6652035713195801, 1.462470531463623, 2.259737491607666, 3.057003974914551, 3.8542709350585938, 4.651537895202637, 5.44880485534668, 6.246071815490723, 7.043338298797607, 7.84060525894165, 8.637872695922852, 9.435138702392578, 10.232405662536621, 11.029672622680664]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 6.0, 19.0, 11.0, 22.0, 23.0, 24.0, 30.0, 34.0, 46.0, 47.0, 49.0, 55.0, 49.0, 59.0, 55.0, 58.0, 52.0, 37.0, 35.0, 39.0, 28.0, 43.0, 33.0, 23.0, 21.0, 21.0, 20.0, 7.0, 4.0, 8.0, 1.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.039276123046875, -10.732244491577148, -10.425213813781738, -10.118182182312012, -9.811151504516602, -9.504119873046875, -9.197089195251465, -8.890057563781738, -8.583026885986328, -8.275995254516602, -7.968964576721191, -7.661933422088623, -7.354902267456055, -7.047871112823486, -6.740839958190918, -6.433808326721191, -6.126777172088623, -5.819746017456055, -5.512714862823486, -5.205683708190918, -4.89865255355835, -4.591621398925781, -4.284589767456055, -3.9775588512420654, -3.670527696609497, -3.3634965419769287, -3.0564653873443604, -2.749433994293213, -2.4424028396606445, -2.135371685028076, -1.8283405303955078, -1.5213093757629395, -1.214278221130371, -0.9072470664978027, -0.6002158522605896, -0.29318463802337646, 0.013846516609191895, 0.32087767124176025, 0.6279089450836182, 0.9349400997161865, 1.2419712543487549, 1.5490024089813232, 1.8560335636138916, 2.163064956665039, 2.4700961112976074, 2.777127265930176, 3.084158420562744, 3.3911895751953125, 3.698220729827881, 4.005251884460449, 4.312283039093018, 4.619314193725586, 4.926345348358154, 5.233376502990723, 5.540408134460449, 5.847438812255859, 6.154470443725586, 6.461501598358154, 6.768532752990723, 7.075563907623291, 7.382595062255859, 7.689626216888428, 7.996657371520996, 8.303689002990723, 8.610719680786133]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 9.0, 10.0, 5.0, 9.0, 22.0, 28.0, 45.0, 83.0, 127.0, 222.0, 370.0, 760.0, 1398.0, 3137.0, 7238.0, 18420.0, 50847.0, 153870.0, 381970.0, 280231.0, 95131.0, 32760.0, 12184.0, 5114.0, 2258.0, 1047.0, 560.0, 270.0, 152.0, 112.0, 64.0, 35.0, 26.0, 12.0, 14.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.91900634765625, -1.8604736328125, -1.80194091796875, -1.743408203125, -1.68487548828125, -1.6263427734375, -1.56781005859375, -1.50927734375, -1.45074462890625, -1.3922119140625, -1.33367919921875, -1.275146484375, -1.21661376953125, -1.1580810546875, -1.09954833984375, -1.041015625, -0.98248291015625, -0.9239501953125, -0.86541748046875, -0.806884765625, -0.74835205078125, -0.6898193359375, -0.63128662109375, -0.57275390625, -0.51422119140625, -0.4556884765625, -0.39715576171875, -0.338623046875, -0.28009033203125, -0.2215576171875, -0.16302490234375, -0.1044921875, -0.04595947265625, 0.0125732421875, 0.07110595703125, 0.129638671875, 0.18817138671875, 0.2467041015625, 0.30523681640625, 0.36376953125, 0.42230224609375, 0.4808349609375, 0.53936767578125, 0.597900390625, 0.65643310546875, 0.7149658203125, 0.77349853515625, 0.83203125, 0.89056396484375, 0.9490966796875, 1.00762939453125, 1.066162109375, 1.12469482421875, 1.1832275390625, 1.24176025390625, 1.30029296875, 1.35882568359375, 1.4173583984375, 1.47589111328125, 1.534423828125, 1.59295654296875, 1.6514892578125, 1.71002197265625, 1.7685546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 8.0, 10.0, 17.0, 22.0, 33.0, 42.0, 48.0, 61.0, 67.0, 78.0, 113.0, 80.0, 86.0, 82.0, 67.0, 44.0, 50.0, 31.0, 19.0, 15.0, 7.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7284393310546875, -1.677581787109375, -1.6267242431640625, -1.57586669921875, -1.5250091552734375, -1.474151611328125, -1.4232940673828125, -1.3724365234375, -1.3215789794921875, -1.270721435546875, -1.2198638916015625, -1.16900634765625, -1.1181488037109375, -1.067291259765625, -1.0164337158203125, -0.965576171875, -0.9147186279296875, -0.863861083984375, -0.8130035400390625, -0.76214599609375, -0.7112884521484375, -0.660430908203125, -0.6095733642578125, -0.5587158203125, -0.5078582763671875, -0.457000732421875, -0.4061431884765625, -0.35528564453125, -0.3044281005859375, -0.253570556640625, -0.2027130126953125, -0.15185546875, -0.1009979248046875, -0.050140380859375, 0.0007171630859375, 0.05157470703125, 0.1024322509765625, 0.153289794921875, 0.2041473388671875, 0.2550048828125, 0.3058624267578125, 0.356719970703125, 0.4075775146484375, 0.45843505859375, 0.5092926025390625, 0.560150146484375, 0.6110076904296875, 0.661865234375, 0.7127227783203125, 0.763580322265625, 0.8144378662109375, 0.86529541015625, 0.9161529541015625, 0.967010498046875, 1.0178680419921875, 1.0687255859375, 1.1195831298828125, 1.170440673828125, 1.2212982177734375, 1.27215576171875, 1.3230133056640625, 1.373870849609375, 1.4247283935546875, 1.4755859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 11.0, 13.0, 18.0, 17.0, 30.0, 59.0, 61.0, 94.0, 143.0, 201.0, 399.0, 703.0, 1519.0, 4191.0, 15835.0, 88121.0, 595014.0, 285102.0, 42752.0, 9047.0, 2773.0, 1107.0, 547.0, 290.0, 179.0, 104.0, 63.0, 47.0, 29.0, 21.0, 8.0, 8.0, 6.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.93359375, -2.841339111328125, -2.74908447265625, -2.656829833984375, -2.5645751953125, -2.472320556640625, -2.38006591796875, -2.287811279296875, -2.195556640625, -2.103302001953125, -2.01104736328125, -1.918792724609375, -1.8265380859375, -1.734283447265625, -1.64202880859375, -1.549774169921875, -1.45751953125, -1.365264892578125, -1.27301025390625, -1.180755615234375, -1.0885009765625, -0.996246337890625, -0.90399169921875, -0.811737060546875, -0.719482421875, -0.627227783203125, -0.53497314453125, -0.442718505859375, -0.3504638671875, -0.258209228515625, -0.16595458984375, -0.073699951171875, 0.0185546875, 0.110809326171875, 0.20306396484375, 0.295318603515625, 0.3875732421875, 0.479827880859375, 0.57208251953125, 0.664337158203125, 0.756591796875, 0.848846435546875, 0.94110107421875, 1.033355712890625, 1.1256103515625, 1.217864990234375, 1.31011962890625, 1.402374267578125, 1.49462890625, 1.586883544921875, 1.67913818359375, 1.771392822265625, 1.8636474609375, 1.955902099609375, 2.04815673828125, 2.140411376953125, 2.232666015625, 2.324920654296875, 2.41717529296875, 2.509429931640625, 2.6016845703125, 2.693939208984375, 2.78619384765625, 2.878448486328125, 2.970703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 0.0, 8.0, 5.0, 14.0, 6.0, 13.0, 12.0, 14.0, 16.0, 20.0, 25.0, 27.0, 26.0, 39.0, 39.0, 33.0, 53.0, 61.0, 43.0, 54.0, 47.0, 60.0, 50.0, 41.0, 50.0, 32.0, 25.0, 31.0, 33.0, 17.0, 13.0, 13.0, 16.0, 14.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.3446044921875, -3.238037109375, -3.1314697265625, -3.02490234375, -2.9183349609375, -2.811767578125, -2.7052001953125, -2.5986328125, -2.4920654296875, -2.385498046875, -2.2789306640625, -2.17236328125, -2.0657958984375, -1.959228515625, -1.8526611328125, -1.74609375, -1.6395263671875, -1.532958984375, -1.4263916015625, -1.31982421875, -1.2132568359375, -1.106689453125, -1.0001220703125, -0.8935546875, -0.7869873046875, -0.680419921875, -0.5738525390625, -0.46728515625, -0.3607177734375, -0.254150390625, -0.1475830078125, -0.041015625, 0.0655517578125, 0.172119140625, 0.2786865234375, 0.38525390625, 0.4918212890625, 0.598388671875, 0.7049560546875, 0.8115234375, 0.9180908203125, 1.024658203125, 1.1312255859375, 1.23779296875, 1.3443603515625, 1.450927734375, 1.5574951171875, 1.6640625, 1.7706298828125, 1.877197265625, 1.9837646484375, 2.09033203125, 2.1968994140625, 2.303466796875, 2.4100341796875, 2.5166015625, 2.6231689453125, 2.729736328125, 2.8363037109375, 2.94287109375, 3.0494384765625, 3.156005859375, 3.2625732421875, 3.369140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 15.0, 25.0, 30.0, 93.0, 242.0, 1038.0, 11156.0, 936631.0, 96247.0, 2386.0, 430.0, 132.0, 47.0, 37.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.588165283203125, -1.49859619140625, -1.409027099609375, -1.3194580078125, -1.229888916015625, -1.14031982421875, -1.050750732421875, -0.961181640625, -0.871612548828125, -0.78204345703125, -0.692474365234375, -0.6029052734375, -0.513336181640625, -0.42376708984375, -0.334197998046875, -0.24462890625, -0.155059814453125, -0.06549072265625, 0.024078369140625, 0.1136474609375, 0.203216552734375, 0.29278564453125, 0.382354736328125, 0.471923828125, 0.561492919921875, 0.65106201171875, 0.740631103515625, 0.8302001953125, 0.919769287109375, 1.00933837890625, 1.098907470703125, 1.1884765625, 1.278045654296875, 1.36761474609375, 1.457183837890625, 1.5467529296875, 1.636322021484375, 1.72589111328125, 1.815460205078125, 1.905029296875, 1.994598388671875, 2.08416748046875, 2.173736572265625, 2.2633056640625, 2.352874755859375, 2.44244384765625, 2.532012939453125, 2.62158203125, 2.711151123046875, 2.80072021484375, 2.890289306640625, 2.9798583984375, 3.069427490234375, 3.15899658203125, 3.248565673828125, 3.338134765625, 3.427703857421875, 3.51727294921875, 3.606842041015625, 3.6964111328125, 3.785980224609375, 3.87554931640625, 3.965118408203125, 4.0546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 17.0, 35.0, 35.0, 46.0, 55.0, 48.0, 59.0, 56.0, 89.0, 60.0, 68.0, 57.0, 52.0, 40.0, 42.0, 24.0, 27.0, 21.0, 19.0, 12.0, 11.0, 11.0, 9.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001404285430908203, -0.00013588741421699524, -0.00013134628534317017, -0.0001268051564693451, -0.00012226402759552002, -0.00011772289872169495, -0.00011318176984786987, -0.0001086406409740448, -0.00010409951210021973, -9.955838322639465e-05, -9.501725435256958e-05, -9.047612547874451e-05, -8.593499660491943e-05, -8.139386773109436e-05, -7.685273885726929e-05, -7.231160998344421e-05, -6.777048110961914e-05, -6.322935223579407e-05, -5.8688223361968994e-05, -5.414709448814392e-05, -4.960596561431885e-05, -4.5064836740493774e-05, -4.05237078666687e-05, -3.598257899284363e-05, -3.1441450119018555e-05, -2.690032124519348e-05, -2.2359192371368408e-05, -1.7818063497543335e-05, -1.3276934623718262e-05, -8.735805749893188e-06, -4.194676876068115e-06, 3.46451997756958e-07, 4.887580871582031e-06, 9.428709745407104e-06, 1.3969838619232178e-05, 1.851096749305725e-05, 2.3052096366882324e-05, 2.7593225240707397e-05, 3.213435411453247e-05, 3.6675482988357544e-05, 4.121661186218262e-05, 4.575774073600769e-05, 5.0298869609832764e-05, 5.483999848365784e-05, 5.938112735748291e-05, 6.392225623130798e-05, 6.846338510513306e-05, 7.300451397895813e-05, 7.75456428527832e-05, 8.208677172660828e-05, 8.662790060043335e-05, 9.116902947425842e-05, 9.57101583480835e-05, 0.00010025128722190857, 0.00010479241609573364, 0.00010933354496955872, 0.00011387467384338379, 0.00011841580271720886, 0.00012295693159103394, 0.000127498060464859, 0.00013203918933868408, 0.00013658031821250916, 0.00014112144708633423, 0.0001456625759601593, 0.00015020370483398438]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 13.0, 21.0, 41.0, 51.0, 71.0, 157.0, 271.0, 621.0, 1441.0, 4864.0, 34892.0, 689701.0, 294675.0, 16544.0, 3118.0, 1022.0, 467.0, 227.0, 114.0, 80.0, 49.0, 40.0, 20.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.560546875, -1.5157623291015625, -1.470977783203125, -1.4261932373046875, -1.38140869140625, -1.3366241455078125, -1.291839599609375, -1.2470550537109375, -1.2022705078125, -1.1574859619140625, -1.112701416015625, -1.0679168701171875, -1.02313232421875, -0.9783477783203125, -0.933563232421875, -0.8887786865234375, -0.843994140625, -0.7992095947265625, -0.754425048828125, -0.7096405029296875, -0.66485595703125, -0.6200714111328125, -0.575286865234375, -0.5305023193359375, -0.4857177734375, -0.4409332275390625, -0.396148681640625, -0.3513641357421875, -0.30657958984375, -0.2617950439453125, -0.217010498046875, -0.1722259521484375, -0.12744140625, -0.0826568603515625, -0.037872314453125, 0.0069122314453125, 0.05169677734375, 0.0964813232421875, 0.141265869140625, 0.1860504150390625, 0.2308349609375, 0.2756195068359375, 0.320404052734375, 0.3651885986328125, 0.40997314453125, 0.4547576904296875, 0.499542236328125, 0.5443267822265625, 0.589111328125, 0.6338958740234375, 0.678680419921875, 0.7234649658203125, 0.76824951171875, 0.8130340576171875, 0.857818603515625, 0.9026031494140625, 0.9473876953125, 0.9921722412109375, 1.036956787109375, 1.0817413330078125, 1.12652587890625, 1.1713104248046875, 1.216094970703125, 1.2608795166015625, 1.3056640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 15.0, 33.0, 33.0, 60.0, 81.0, 81.0, 118.0, 126.0, 113.0, 104.0, 80.0, 57.0, 35.0, 21.0, 14.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.129730224609375, -1.08367919921875, -1.037628173828125, -0.9915771484375, -0.945526123046875, -0.89947509765625, -0.853424072265625, -0.807373046875, -0.761322021484375, -0.71527099609375, -0.669219970703125, -0.6231689453125, -0.577117919921875, -0.53106689453125, -0.485015869140625, -0.43896484375, -0.392913818359375, -0.34686279296875, -0.300811767578125, -0.2547607421875, -0.208709716796875, -0.16265869140625, -0.116607666015625, -0.070556640625, -0.024505615234375, 0.02154541015625, 0.067596435546875, 0.1136474609375, 0.159698486328125, 0.20574951171875, 0.251800537109375, 0.2978515625, 0.343902587890625, 0.38995361328125, 0.436004638671875, 0.4820556640625, 0.528106689453125, 0.57415771484375, 0.620208740234375, 0.666259765625, 0.712310791015625, 0.75836181640625, 0.804412841796875, 0.8504638671875, 0.896514892578125, 0.94256591796875, 0.988616943359375, 1.03466796875, 1.080718994140625, 1.12677001953125, 1.172821044921875, 1.2188720703125, 1.264923095703125, 1.31097412109375, 1.357025146484375, 1.403076171875, 1.449127197265625, 1.49517822265625, 1.541229248046875, 1.5872802734375, 1.633331298828125, 1.67938232421875, 1.725433349609375, 1.771484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 22.0, 65.0, 94.0, 209.0, 289.0, 167.0, 99.0, 26.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.257118225097656, -43.23796463012695, -42.218814849853516, -41.19966125488281, -40.180511474609375, -39.16135787963867, -38.14220428466797, -37.12305450439453, -36.10390090942383, -35.084747314453125, -34.06559753417969, -33.046443939208984, -32.02729034423828, -31.008140563964844, -29.98898696899414, -28.96983528137207, -27.95068359375, -26.93153190612793, -25.91238021850586, -24.893226623535156, -23.874074935913086, -22.854923248291016, -21.835769653320312, -20.816617965698242, -19.797466278076172, -18.7783145904541, -17.75916290283203, -16.740009307861328, -15.720857620239258, -14.701705932617188, -13.6825532913208, -12.663400650024414, -11.644245147705078, -10.625093460083008, -9.605940818786621, -8.586788177490234, -7.567636489868164, -6.5484843254089355, -5.529332160949707, -4.5101799964904785, -3.49102783203125, -2.4718756675720215, -1.452723503112793, -0.43357133865356445, 0.5855808258056641, 1.6047329902648926, 2.623885154724121, 3.6430373191833496, 4.662189483642578, 5.681341648101807, 6.700493812561035, 7.719645977020264, 8.738798141479492, 9.757949829101562, 10.77710247039795, 11.796255111694336, 12.815406799316406, 13.834558486938477, 14.853711128234863, 15.87286376953125, 16.89201545715332, 17.91116714477539, 18.930320739746094, 19.949472427368164, 20.968624114990234]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 16.0, 27.0, 27.0, 27.0, 39.0, 60.0, 61.0, 62.0, 69.0, 96.0, 99.0, 65.0, 61.0, 52.0, 52.0, 35.0, 45.0, 35.0, 13.0, 21.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.88585662841797, -20.139802932739258, -19.393747329711914, -18.647693634033203, -17.90163803100586, -17.15558433532715, -16.409530639648438, -15.66347599029541, -14.917421340942383, -14.171366691589355, -13.425312042236328, -12.679258346557617, -11.93320369720459, -11.187149047851562, -10.441095352172852, -9.695040702819824, -8.948986053466797, -8.20293140411377, -7.4568772315979, -6.710823059082031, -5.964768409729004, -5.218713760375977, -4.472659587860107, -3.7266054153442383, -2.980550765991211, -2.2344963550567627, -1.4884419441223145, -0.7423875331878662, 0.0036668777465820312, 0.7497212886810303, 1.4957756996154785, 2.2418298721313477, 2.987882614135742, 3.7339370250701904, 4.479991436004639, 5.226045608520508, 5.972100257873535, 6.7181549072265625, 7.464209079742432, 8.2102632522583, 8.956317901611328, 9.702372550964355, 10.448427200317383, 11.194480895996094, 11.940535545349121, 12.686590194702148, 13.43264389038086, 14.178698539733887, 14.924753189086914, 15.670807838439941, 16.41686248779297, 17.16291618347168, 17.90896987915039, 18.655025482177734, 19.401079177856445, 20.147132873535156, 20.8931884765625, 21.63924217224121, 22.385297775268555, 23.131351470947266, 23.87740707397461, 24.62346076965332, 25.36951446533203, 26.115570068359375, 26.861623764038086]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 19.0, 31.0, 48.0, 80.0, 130.0, 252.0, 559.0, 1200.0, 3149.0, 10871.0, 55866.0, 743970.0, 3059850.0, 278162.0, 29675.0, 6513.0, 2050.0, 863.0, 432.0, 210.0, 118.0, 81.0, 42.0, 30.0, 22.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.25506591796875, -1.2034912109375, -1.15191650390625, -1.100341796875, -1.04876708984375, -0.9971923828125, -0.94561767578125, -0.89404296875, -0.84246826171875, -0.7908935546875, -0.73931884765625, -0.687744140625, -0.63616943359375, -0.5845947265625, -0.53302001953125, -0.4814453125, -0.42987060546875, -0.3782958984375, -0.32672119140625, -0.275146484375, -0.22357177734375, -0.1719970703125, -0.12042236328125, -0.06884765625, -0.01727294921875, 0.0343017578125, 0.08587646484375, 0.137451171875, 0.18902587890625, 0.2406005859375, 0.29217529296875, 0.34375, 0.39532470703125, 0.4468994140625, 0.49847412109375, 0.550048828125, 0.60162353515625, 0.6531982421875, 0.70477294921875, 0.75634765625, 0.80792236328125, 0.8594970703125, 0.91107177734375, 0.962646484375, 1.01422119140625, 1.0657958984375, 1.11737060546875, 1.1689453125, 1.22052001953125, 1.2720947265625, 1.32366943359375, 1.375244140625, 1.42681884765625, 1.4783935546875, 1.52996826171875, 1.58154296875, 1.63311767578125, 1.6846923828125, 1.73626708984375, 1.787841796875, 1.83941650390625, 1.8909912109375, 1.94256591796875, 1.994140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 4.0, 9.0, 16.0, 20.0, 29.0, 37.0, 46.0, 52.0, 54.0, 59.0, 83.0, 80.0, 78.0, 73.0, 67.0, 67.0, 55.0, 48.0, 35.0, 19.0, 23.0, 11.0, 12.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9523696899414062, -0.9110870361328125, -0.8698043823242188, -0.828521728515625, -0.7872390747070312, -0.7459564208984375, -0.7046737670898438, -0.66339111328125, -0.6221084594726562, -0.5808258056640625, -0.5395431518554688, -0.498260498046875, -0.45697784423828125, -0.4156951904296875, -0.37441253662109375, -0.3331298828125, -0.29184722900390625, -0.2505645751953125, -0.20928192138671875, -0.167999267578125, -0.12671661376953125, -0.0854339599609375, -0.04415130615234375, -0.00286865234375, 0.03841400146484375, 0.0796966552734375, 0.12097930908203125, 0.162261962890625, 0.20354461669921875, 0.2448272705078125, 0.28610992431640625, 0.327392578125, 0.36867523193359375, 0.4099578857421875, 0.45124053955078125, 0.492523193359375, 0.5338058471679688, 0.5750885009765625, 0.6163711547851562, 0.65765380859375, 0.6989364624023438, 0.7402191162109375, 0.7815017700195312, 0.822784423828125, 0.8640670776367188, 0.9053497314453125, 0.9466323852539062, 0.9879150390625, 1.0291976928710938, 1.0704803466796875, 1.1117630004882812, 1.153045654296875, 1.1943283081054688, 1.2356109619140625, 1.2768936157226562, 1.31817626953125, 1.3594589233398438, 1.4007415771484375, 1.4420242309570312, 1.483306884765625, 1.5245895385742188, 1.5658721923828125, 1.6071548461914062, 1.6484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 15.0, 22.0, 25.0, 38.0, 42.0, 73.0, 124.0, 243.0, 464.0, 999.0, 2495.0, 7320.0, 30758.0, 253667.0, 3533940.0, 319314.0, 32899.0, 7294.0, 2398.0, 979.0, 512.0, 246.0, 150.0, 76.0, 64.0, 28.0, 14.0, 18.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.159332275390625, -2.08624267578125, -2.013153076171875, -1.9400634765625, -1.866973876953125, -1.79388427734375, -1.720794677734375, -1.647705078125, -1.574615478515625, -1.50152587890625, -1.428436279296875, -1.3553466796875, -1.282257080078125, -1.20916748046875, -1.136077880859375, -1.06298828125, -0.989898681640625, -0.91680908203125, -0.843719482421875, -0.7706298828125, -0.697540283203125, -0.62445068359375, -0.551361083984375, -0.478271484375, -0.405181884765625, -0.33209228515625, -0.259002685546875, -0.1859130859375, -0.112823486328125, -0.03973388671875, 0.033355712890625, 0.1064453125, 0.179534912109375, 0.25262451171875, 0.325714111328125, 0.3988037109375, 0.471893310546875, 0.54498291015625, 0.618072509765625, 0.691162109375, 0.764251708984375, 0.83734130859375, 0.910430908203125, 0.9835205078125, 1.056610107421875, 1.12969970703125, 1.202789306640625, 1.27587890625, 1.348968505859375, 1.42205810546875, 1.495147705078125, 1.5682373046875, 1.641326904296875, 1.71441650390625, 1.787506103515625, 1.860595703125, 1.933685302734375, 2.00677490234375, 2.079864501953125, 2.1529541015625, 2.226043701171875, 2.29913330078125, 2.372222900390625, 2.4453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 5.0, 13.0, 25.0, 23.0, 43.0, 59.0, 100.0, 164.0, 315.0, 711.0, 1014.0, 737.0, 376.0, 178.0, 110.0, 69.0, 40.0, 26.0, 12.0, 9.0, 3.0, 5.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09735107421875, -3.0052490234375, -2.91314697265625, -2.821044921875, -2.72894287109375, -2.6368408203125, -2.54473876953125, -2.45263671875, -2.36053466796875, -2.2684326171875, -2.17633056640625, -2.084228515625, -1.99212646484375, -1.9000244140625, -1.80792236328125, -1.7158203125, -1.62371826171875, -1.5316162109375, -1.43951416015625, -1.347412109375, -1.25531005859375, -1.1632080078125, -1.07110595703125, -0.97900390625, -0.88690185546875, -0.7947998046875, -0.70269775390625, -0.610595703125, -0.51849365234375, -0.4263916015625, -0.33428955078125, -0.2421875, -0.15008544921875, -0.0579833984375, 0.03411865234375, 0.126220703125, 0.21832275390625, 0.3104248046875, 0.40252685546875, 0.49462890625, 0.58673095703125, 0.6788330078125, 0.77093505859375, 0.863037109375, 0.95513916015625, 1.0472412109375, 1.13934326171875, 1.2314453125, 1.32354736328125, 1.4156494140625, 1.50775146484375, 1.599853515625, 1.69195556640625, 1.7840576171875, 1.87615966796875, 1.96826171875, 2.06036376953125, 2.1524658203125, 2.24456787109375, 2.336669921875, 2.42877197265625, 2.5208740234375, 2.61297607421875, 2.705078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 22.0, 33.0, 109.0, 202.0, 257.0, 173.0, 105.0, 37.0, 15.0, 5.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.569122314453125, -23.75977325439453, -22.950424194335938, -22.141075134277344, -21.33172607421875, -20.522377014160156, -19.71302604675293, -18.903676986694336, -18.094327926635742, -17.28497886657715, -16.475629806518555, -15.666279792785645, -14.85693073272705, -14.047581672668457, -13.238231658935547, -12.428882598876953, -11.61953353881836, -10.810184478759766, -10.000835418701172, -9.191485404968262, -8.382136344909668, -7.572787284851074, -6.763437747955322, -5.95408821105957, -5.144739151000977, -4.335390090942383, -3.526040554046631, -2.716691255569458, -1.9073419570922852, -1.0979928970336914, -0.28864336013793945, 0.5207061767578125, 1.330057144165039, 2.139406442642212, 2.9487557411193848, 3.7581050395965576, 4.5674543380737305, 5.376803398132324, 6.186152935028076, 6.995502471923828, 7.804851531982422, 8.614200592041016, 9.42354965209961, 10.23289966583252, 11.042248725891113, 11.851597785949707, 12.660947799682617, 13.470296859741211, 14.279645919799805, 15.088994979858398, 15.898344039916992, 16.707693099975586, 17.517044067382812, 18.326393127441406, 19.1357421875, 19.945091247558594, 20.754440307617188, 21.56378936767578, 22.373138427734375, 23.18248748779297, 23.991836547851562, 24.801185607910156, 25.610536575317383, 26.419885635375977, 27.22923469543457]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 14.0, 15.0, 28.0, 20.0, 32.0, 26.0, 28.0, 37.0, 38.0, 40.0, 48.0, 43.0, 38.0, 51.0, 49.0, 45.0, 48.0, 39.0, 36.0, 35.0, 29.0, 27.0, 36.0, 26.0, 19.0, 15.0, 15.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.81758975982666, -10.494715690612793, -10.17184066772461, -9.848966598510742, -9.526092529296875, -9.203218460083008, -8.880343437194824, -8.557469367980957, -8.23459529876709, -7.9117207527160645, -7.588846683502197, -7.265972137451172, -6.943098068237305, -6.620223522186279, -6.297348976135254, -5.974474906921387, -5.651600360870361, -5.328725814819336, -5.005851745605469, -4.682977199554443, -4.360103130340576, -4.037228584289551, -3.7143542766571045, -3.391479969024658, -3.068605661392212, -2.7457313537597656, -2.4228570461273193, -2.099982738494873, -1.7771083116531372, -1.454234004020691, -1.131359577178955, -0.8084852695465088, -0.4856109619140625, -0.16273662447929382, 0.16013771295547485, 0.4830120801925659, 0.8058863878250122, 1.1287606954574585, 1.4516351222991943, 1.7745094299316406, 2.097383737564087, 2.420258045196533, 2.7431323528289795, 3.066006660461426, 3.388881206512451, 3.7117552757263184, 4.034629821777344, 4.357503890991211, 4.680378437042236, 5.003252983093262, 5.326127052307129, 5.649001598358154, 5.9718756675720215, 6.294750213623047, 6.617624282836914, 6.9404988288879395, 7.263373374938965, 7.58624792098999, 7.909121990203857, 8.231996536254883, 8.55487060546875, 8.877744674682617, 9.2006196975708, 9.523493766784668, 9.846367835998535]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 11.0, 12.0, 19.0, 26.0, 65.0, 90.0, 165.0, 246.0, 422.0, 742.0, 1656.0, 3257.0, 7405.0, 17309.0, 42954.0, 106416.0, 234440.0, 311552.0, 185660.0, 80064.0, 31923.0, 13000.0, 5614.0, 2630.0, 1261.0, 695.0, 371.0, 208.0, 134.0, 64.0, 57.0, 34.0, 17.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.267181396484375, -1.22674560546875, -1.186309814453125, -1.1458740234375, -1.105438232421875, -1.06500244140625, -1.024566650390625, -0.984130859375, -0.943695068359375, -0.90325927734375, -0.862823486328125, -0.8223876953125, -0.781951904296875, -0.74151611328125, -0.701080322265625, -0.66064453125, -0.620208740234375, -0.57977294921875, -0.539337158203125, -0.4989013671875, -0.458465576171875, -0.41802978515625, -0.377593994140625, -0.337158203125, -0.296722412109375, -0.25628662109375, -0.215850830078125, -0.1754150390625, -0.134979248046875, -0.09454345703125, -0.054107666015625, -0.013671875, 0.026763916015625, 0.06719970703125, 0.107635498046875, 0.1480712890625, 0.188507080078125, 0.22894287109375, 0.269378662109375, 0.309814453125, 0.350250244140625, 0.39068603515625, 0.431121826171875, 0.4715576171875, 0.511993408203125, 0.55242919921875, 0.592864990234375, 0.63330078125, 0.673736572265625, 0.71417236328125, 0.754608154296875, 0.7950439453125, 0.835479736328125, 0.87591552734375, 0.916351318359375, 0.956787109375, 0.997222900390625, 1.03765869140625, 1.078094482421875, 1.1185302734375, 1.158966064453125, 1.19940185546875, 1.239837646484375, 1.2802734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 10.0, 14.0, 13.0, 19.0, 32.0, 21.0, 55.0, 39.0, 42.0, 54.0, 49.0, 58.0, 61.0, 67.0, 55.0, 51.0, 55.0, 45.0, 35.0, 35.0, 30.0, 32.0, 22.0, 19.0, 12.0, 16.0, 7.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0615234375, -1.0304412841796875, -0.999359130859375, -0.9682769775390625, -0.93719482421875, -0.9061126708984375, -0.875030517578125, -0.8439483642578125, -0.8128662109375, -0.7817840576171875, -0.750701904296875, -0.7196197509765625, -0.68853759765625, -0.6574554443359375, -0.626373291015625, -0.5952911376953125, -0.564208984375, -0.5331268310546875, -0.502044677734375, -0.4709625244140625, -0.43988037109375, -0.4087982177734375, -0.377716064453125, -0.3466339111328125, -0.3155517578125, -0.2844696044921875, -0.253387451171875, -0.2223052978515625, -0.19122314453125, -0.1601409912109375, -0.129058837890625, -0.0979766845703125, -0.06689453125, -0.0358123779296875, -0.004730224609375, 0.0263519287109375, 0.05743408203125, 0.0885162353515625, 0.119598388671875, 0.1506805419921875, 0.1817626953125, 0.2128448486328125, 0.243927001953125, 0.2750091552734375, 0.30609130859375, 0.3371734619140625, 0.368255615234375, 0.3993377685546875, 0.430419921875, 0.4615020751953125, 0.492584228515625, 0.5236663818359375, 0.55474853515625, 0.5858306884765625, 0.616912841796875, 0.6479949951171875, 0.6790771484375, 0.7101593017578125, 0.741241455078125, 0.7723236083984375, 0.80340576171875, 0.8344879150390625, 0.865570068359375, 0.8966522216796875, 0.927734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 14.0, 14.0, 24.0, 37.0, 40.0, 59.0, 106.0, 128.0, 183.0, 263.0, 377.0, 586.0, 1020.0, 2016.0, 5548.0, 26407.0, 253199.0, 672252.0, 69672.0, 10071.0, 2979.0, 1276.0, 720.0, 457.0, 305.0, 186.0, 149.0, 127.0, 77.0, 63.0, 54.0, 30.0, 23.0, 16.0, 11.0, 15.0, 12.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-3.125, -3.03094482421875, -2.9368896484375, -2.84283447265625, -2.748779296875, -2.65472412109375, -2.5606689453125, -2.46661376953125, -2.37255859375, -2.27850341796875, -2.1844482421875, -2.09039306640625, -1.996337890625, -1.90228271484375, -1.8082275390625, -1.71417236328125, -1.6201171875, -1.52606201171875, -1.4320068359375, -1.33795166015625, -1.243896484375, -1.14984130859375, -1.0557861328125, -0.96173095703125, -0.86767578125, -0.77362060546875, -0.6795654296875, -0.58551025390625, -0.491455078125, -0.39739990234375, -0.3033447265625, -0.20928955078125, -0.115234375, -0.02117919921875, 0.0728759765625, 0.16693115234375, 0.260986328125, 0.35504150390625, 0.4490966796875, 0.54315185546875, 0.63720703125, 0.73126220703125, 0.8253173828125, 0.91937255859375, 1.013427734375, 1.10748291015625, 1.2015380859375, 1.29559326171875, 1.3896484375, 1.48370361328125, 1.5777587890625, 1.67181396484375, 1.765869140625, 1.85992431640625, 1.9539794921875, 2.04803466796875, 2.14208984375, 2.23614501953125, 2.3302001953125, 2.42425537109375, 2.518310546875, 2.61236572265625, 2.7064208984375, 2.80047607421875, 2.89453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 10.0, 12.0, 14.0, 7.0, 11.0, 13.0, 31.0, 25.0, 41.0, 31.0, 37.0, 47.0, 37.0, 30.0, 47.0, 42.0, 53.0, 41.0, 41.0, 31.0, 39.0, 32.0, 37.0, 37.0, 26.0, 41.0, 22.0, 22.0, 18.0, 19.0, 15.0, 11.0, 5.0, 11.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.427734375, -3.32080078125, -3.2138671875, -3.10693359375, -3.0, -2.89306640625, -2.7861328125, -2.67919921875, -2.572265625, -2.46533203125, -2.3583984375, -2.25146484375, -2.14453125, -2.03759765625, -1.9306640625, -1.82373046875, -1.716796875, -1.60986328125, -1.5029296875, -1.39599609375, -1.2890625, -1.18212890625, -1.0751953125, -0.96826171875, -0.861328125, -0.75439453125, -0.6474609375, -0.54052734375, -0.43359375, -0.32666015625, -0.2197265625, -0.11279296875, -0.005859375, 0.10107421875, 0.2080078125, 0.31494140625, 0.421875, 0.52880859375, 0.6357421875, 0.74267578125, 0.849609375, 0.95654296875, 1.0634765625, 1.17041015625, 1.27734375, 1.38427734375, 1.4912109375, 1.59814453125, 1.705078125, 1.81201171875, 1.9189453125, 2.02587890625, 2.1328125, 2.23974609375, 2.3466796875, 2.45361328125, 2.560546875, 2.66748046875, 2.7744140625, 2.88134765625, 2.98828125, 3.09521484375, 3.2021484375, 3.30908203125, 3.416015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 27.0, 42.0, 75.0, 222.0, 536.0, 2536.0, 41220.0, 941287.0, 58537.0, 3031.0, 645.0, 206.0, 80.0, 35.0, 19.0, 11.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.58502197265625, -1.5313720703125, -1.47772216796875, -1.424072265625, -1.37042236328125, -1.3167724609375, -1.26312255859375, -1.20947265625, -1.15582275390625, -1.1021728515625, -1.04852294921875, -0.994873046875, -0.94122314453125, -0.8875732421875, -0.83392333984375, -0.7802734375, -0.72662353515625, -0.6729736328125, -0.61932373046875, -0.565673828125, -0.51202392578125, -0.4583740234375, -0.40472412109375, -0.35107421875, -0.29742431640625, -0.2437744140625, -0.19012451171875, -0.136474609375, -0.08282470703125, -0.0291748046875, 0.02447509765625, 0.078125, 0.13177490234375, 0.1854248046875, 0.23907470703125, 0.292724609375, 0.34637451171875, 0.4000244140625, 0.45367431640625, 0.50732421875, 0.56097412109375, 0.6146240234375, 0.66827392578125, 0.721923828125, 0.77557373046875, 0.8292236328125, 0.88287353515625, 0.9365234375, 0.99017333984375, 1.0438232421875, 1.09747314453125, 1.151123046875, 1.20477294921875, 1.2584228515625, 1.31207275390625, 1.36572265625, 1.41937255859375, 1.4730224609375, 1.52667236328125, 1.580322265625, 1.63397216796875, 1.6876220703125, 1.74127197265625, 1.794921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 25.0, 17.0, 27.0, 47.0, 47.0, 92.0, 130.0, 117.0, 134.0, 94.0, 68.0, 49.0, 37.0, 24.0, 23.0, 17.0, 12.0, 4.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003330707550048828, -0.00032491981983184814, -0.0003167688846588135, -0.0003086179494857788, -0.00030046701431274414, -0.00029231607913970947, -0.0002841651439666748, -0.00027601420879364014, -0.00026786327362060547, -0.0002597123384475708, -0.00025156140327453613, -0.00024341046810150146, -0.0002352595329284668, -0.00022710859775543213, -0.00021895766258239746, -0.0002108067274093628, -0.00020265579223632812, -0.00019450485706329346, -0.0001863539218902588, -0.00017820298671722412, -0.00017005205154418945, -0.00016190111637115479, -0.00015375018119812012, -0.00014559924602508545, -0.00013744831085205078, -0.0001292973756790161, -0.00012114644050598145, -0.00011299550533294678, -0.00010484457015991211, -9.669363498687744e-05, -8.854269981384277e-05, -8.03917646408081e-05, -7.224082946777344e-05, -6.408989429473877e-05, -5.59389591217041e-05, -4.7788023948669434e-05, -3.9637088775634766e-05, -3.14861536026001e-05, -2.333521842956543e-05, -1.5184283256530762e-05, -7.033348083496094e-06, 1.1175870895385742e-06, 9.268522262573242e-06, 1.741945743560791e-05, 2.5570392608642578e-05, 3.3721327781677246e-05, 4.1872262954711914e-05, 5.002319812774658e-05, 5.817413330078125e-05, 6.632506847381592e-05, 7.447600364685059e-05, 8.262693881988525e-05, 9.077787399291992e-05, 9.892880916595459e-05, 0.00010707974433898926, 0.00011523067951202393, 0.0001233816146850586, 0.00013153254985809326, 0.00013968348503112793, 0.0001478344202041626, 0.00015598535537719727, 0.00016413629055023193, 0.0001722872257232666, 0.00018043816089630127, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 9.0, 17.0, 17.0, 36.0, 53.0, 108.0, 217.0, 429.0, 977.0, 2664.0, 13423.0, 196161.0, 778581.0, 47242.0, 5775.0, 1572.0, 599.0, 297.0, 161.0, 85.0, 57.0, 20.0, 24.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2838287353515625, -1.250274658203125, -1.2167205810546875, -1.18316650390625, -1.1496124267578125, -1.116058349609375, -1.0825042724609375, -1.0489501953125, -1.0153961181640625, -0.981842041015625, -0.9482879638671875, -0.91473388671875, -0.8811798095703125, -0.847625732421875, -0.8140716552734375, -0.780517578125, -0.7469635009765625, -0.713409423828125, -0.6798553466796875, -0.64630126953125, -0.6127471923828125, -0.579193115234375, -0.5456390380859375, -0.5120849609375, -0.4785308837890625, -0.444976806640625, -0.4114227294921875, -0.37786865234375, -0.3443145751953125, -0.310760498046875, -0.2772064208984375, -0.24365234375, -0.2100982666015625, -0.176544189453125, -0.1429901123046875, -0.10943603515625, -0.0758819580078125, -0.042327880859375, -0.0087738037109375, 0.0247802734375, 0.0583343505859375, 0.091888427734375, 0.1254425048828125, 0.15899658203125, 0.1925506591796875, 0.226104736328125, 0.2596588134765625, 0.293212890625, 0.3267669677734375, 0.360321044921875, 0.3938751220703125, 0.42742919921875, 0.4609832763671875, 0.494537353515625, 0.5280914306640625, 0.5616455078125, 0.5951995849609375, 0.628753662109375, 0.6623077392578125, 0.69586181640625, 0.7294158935546875, 0.762969970703125, 0.7965240478515625, 0.830078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 4.0, 10.0, 9.0, 10.0, 17.0, 21.0, 31.0, 39.0, 34.0, 41.0, 55.0, 72.0, 66.0, 63.0, 75.0, 59.0, 59.0, 55.0, 46.0, 44.0, 35.0, 34.0, 18.0, 16.0, 15.0, 12.0, 8.0, 4.0, 10.0, 4.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6647186279296875, -0.643402099609375, -0.6220855712890625, -0.60076904296875, -0.5794525146484375, -0.558135986328125, -0.5368194580078125, -0.5155029296875, -0.4941864013671875, -0.472869873046875, -0.4515533447265625, -0.43023681640625, -0.4089202880859375, -0.387603759765625, -0.3662872314453125, -0.344970703125, -0.3236541748046875, -0.302337646484375, -0.2810211181640625, -0.25970458984375, -0.2383880615234375, -0.217071533203125, -0.1957550048828125, -0.1744384765625, -0.1531219482421875, -0.131805419921875, -0.1104888916015625, -0.08917236328125, -0.0678558349609375, -0.046539306640625, -0.0252227783203125, -0.00390625, 0.0174102783203125, 0.038726806640625, 0.0600433349609375, 0.08135986328125, 0.1026763916015625, 0.123992919921875, 0.1453094482421875, 0.1666259765625, 0.1879425048828125, 0.209259033203125, 0.2305755615234375, 0.25189208984375, 0.2732086181640625, 0.294525146484375, 0.3158416748046875, 0.337158203125, 0.3584747314453125, 0.379791259765625, 0.4011077880859375, 0.42242431640625, 0.4437408447265625, 0.465057373046875, 0.4863739013671875, 0.5076904296875, 0.5290069580078125, 0.550323486328125, 0.5716400146484375, 0.59295654296875, 0.6142730712890625, 0.635589599609375, 0.6569061279296875, 0.67822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 11.0, 29.0, 33.0, 90.0, 154.0, 215.0, 213.0, 117.0, 55.0, 39.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.04113006591797, -19.432435989379883, -18.823741912841797, -18.215045928955078, -17.606351852416992, -16.997657775878906, -16.38896369934082, -15.780268669128418, -15.171573638916016, -14.56287956237793, -13.954184532165527, -13.345490455627441, -12.736795425415039, -12.128101348876953, -11.519407272338867, -10.910712242126465, -10.302018165588379, -9.693324089050293, -9.08462905883789, -8.475934982299805, -7.867239952087402, -7.258545875549316, -6.649851322174072, -6.041156768798828, -5.432462215423584, -4.82376766204834, -4.215073108673096, -3.6063787937164307, -2.9976842403411865, -2.3889896869659424, -1.7802953720092773, -1.1716008186340332, -0.5629062652587891, 0.0457882285118103, 0.6544827222824097, 1.2631771564483643, 1.8718717098236084, 2.4805662631988525, 3.0892605781555176, 3.6979551315307617, 4.306649684906006, 4.91534423828125, 5.524038791656494, 6.132733345031738, 6.741427421569824, 7.350122451782227, 7.9588165283203125, 8.567510604858398, 9.1762056350708, 9.784899711608887, 10.393594741821289, 11.002288818359375, 11.610983848571777, 12.219677925109863, 12.828372955322266, 13.437067031860352, 14.045761108398438, 14.654455184936523, 15.263150215148926, 15.871844291687012, 16.480539321899414, 17.0892333984375, 17.697927474975586, 18.306621551513672, 18.91531753540039]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 0.0, 4.0, 6.0, 8.0, 18.0, 11.0, 24.0, 21.0, 32.0, 42.0, 37.0, 33.0, 71.0, 60.0, 89.0, 116.0, 74.0, 64.0, 43.0, 50.0, 56.0, 32.0, 32.0, 23.0, 14.0, 11.0, 11.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.731983184814453, -26.08621597290039, -25.440446853637695, -24.794679641723633, -24.14891242980957, -23.503145217895508, -22.857376098632812, -22.21160888671875, -21.565841674804688, -20.920074462890625, -20.27430534362793, -19.628538131713867, -18.982770919799805, -18.337003707885742, -17.691234588623047, -17.045467376708984, -16.399700164794922, -15.753931999206543, -15.10816478729248, -14.462396621704102, -13.816629409790039, -13.17086124420166, -12.525093078613281, -11.879325866699219, -11.233556747436523, -10.587788581848145, -9.942021369934082, -9.296253204345703, -8.65048599243164, -8.004717826843262, -7.358950138092041, -6.71318244934082, -6.067415237426758, -5.421647548675537, -4.775879859924316, -4.1301116943359375, -3.484344244003296, -2.838576555252075, -2.1928086280822754, -1.5470409393310547, -0.901273250579834, -0.2555055022239685, 0.390262246131897, 1.0360300540924072, 1.681797742843628, 2.3275654315948486, 2.9733333587646484, 3.619101047515869, 4.26486873626709, 4.9106364250183105, 5.556404113769531, 6.20217227935791, 6.847939491271973, 7.493707656860352, 8.139474868774414, 8.785243034362793, 9.431011199951172, 10.07677936553955, 10.722546577453613, 11.368314743041992, 12.014081954956055, 12.659850120544434, 13.305618286132812, 13.951385498046875, 14.597152709960938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 17.0, 13.0, 29.0, 57.0, 90.0, 141.0, 304.0, 548.0, 1106.0, 2600.0, 7023.0, 24979.0, 126243.0, 919856.0, 2500677.0, 503236.0, 77142.0, 18822.0, 6155.0, 2586.0, 1265.0, 633.0, 352.0, 174.0, 88.0, 42.0, 32.0, 8.0, 13.0, 9.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3505859375, -1.3171234130859375, -1.283660888671875, -1.2501983642578125, -1.21673583984375, -1.1832733154296875, -1.149810791015625, -1.1163482666015625, -1.0828857421875, -1.0494232177734375, -1.015960693359375, -0.9824981689453125, -0.94903564453125, -0.9155731201171875, -0.882110595703125, -0.8486480712890625, -0.815185546875, -0.7817230224609375, -0.748260498046875, -0.7147979736328125, -0.68133544921875, -0.6478729248046875, -0.614410400390625, -0.5809478759765625, -0.5474853515625, -0.5140228271484375, -0.480560302734375, -0.4470977783203125, -0.41363525390625, -0.3801727294921875, -0.346710205078125, -0.3132476806640625, -0.27978515625, -0.2463226318359375, -0.212860107421875, -0.1793975830078125, -0.14593505859375, -0.1124725341796875, -0.079010009765625, -0.0455474853515625, -0.0120849609375, 0.0213775634765625, 0.054840087890625, 0.0883026123046875, 0.12176513671875, 0.1552276611328125, 0.188690185546875, 0.2221527099609375, 0.255615234375, 0.2890777587890625, 0.322540283203125, 0.3560028076171875, 0.38946533203125, 0.4229278564453125, 0.456390380859375, 0.4898529052734375, 0.5233154296875, 0.5567779541015625, 0.590240478515625, 0.6237030029296875, 0.65716552734375, 0.6906280517578125, 0.724090576171875, 0.7575531005859375, 0.791015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 24.0, 43.0, 51.0, 71.0, 88.0, 88.0, 106.0, 105.0, 99.0, 85.0, 53.0, 45.0, 36.0, 25.0, 19.0, 11.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4375, -2.3855438232421875, -2.333587646484375, -2.2816314697265625, -2.22967529296875, -2.1777191162109375, -2.125762939453125, -2.0738067626953125, -2.0218505859375, -1.9698944091796875, -1.917938232421875, -1.8659820556640625, -1.81402587890625, -1.7620697021484375, -1.710113525390625, -1.6581573486328125, -1.606201171875, -1.5542449951171875, -1.502288818359375, -1.4503326416015625, -1.39837646484375, -1.3464202880859375, -1.294464111328125, -1.2425079345703125, -1.1905517578125, -1.1385955810546875, -1.086639404296875, -1.0346832275390625, -0.98272705078125, -0.9307708740234375, -0.878814697265625, -0.8268585205078125, -0.77490234375, -0.7229461669921875, -0.670989990234375, -0.6190338134765625, -0.56707763671875, -0.5151214599609375, -0.463165283203125, -0.4112091064453125, -0.3592529296875, -0.3072967529296875, -0.255340576171875, -0.2033843994140625, -0.15142822265625, -0.0994720458984375, -0.047515869140625, 0.0044403076171875, 0.056396484375, 0.1083526611328125, 0.160308837890625, 0.2122650146484375, 0.26422119140625, 0.3161773681640625, 0.368133544921875, 0.4200897216796875, 0.4720458984375, 0.5240020751953125, 0.575958251953125, 0.6279144287109375, 0.67987060546875, 0.7318267822265625, 0.783782958984375, 0.8357391357421875, 0.8876953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 10.0, 12.0, 20.0, 31.0, 50.0, 84.0, 156.0, 248.0, 449.0, 1015.0, 2702.0, 7728.0, 29591.0, 186522.0, 2978607.0, 879457.0, 80889.0, 17803.0, 5165.0, 1895.0, 808.0, 421.0, 218.0, 150.0, 73.0, 53.0, 36.0, 24.0, 19.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.71875, -1.6693115234375, -1.619873046875, -1.5704345703125, -1.52099609375, -1.4715576171875, -1.422119140625, -1.3726806640625, -1.3232421875, -1.2738037109375, -1.224365234375, -1.1749267578125, -1.12548828125, -1.0760498046875, -1.026611328125, -0.9771728515625, -0.927734375, -0.8782958984375, -0.828857421875, -0.7794189453125, -0.72998046875, -0.6805419921875, -0.631103515625, -0.5816650390625, -0.5322265625, -0.4827880859375, -0.433349609375, -0.3839111328125, -0.33447265625, -0.2850341796875, -0.235595703125, -0.1861572265625, -0.13671875, -0.0872802734375, -0.037841796875, 0.0115966796875, 0.06103515625, 0.1104736328125, 0.159912109375, 0.2093505859375, 0.2587890625, 0.3082275390625, 0.357666015625, 0.4071044921875, 0.45654296875, 0.5059814453125, 0.555419921875, 0.6048583984375, 0.654296875, 0.7037353515625, 0.753173828125, 0.8026123046875, 0.85205078125, 0.9014892578125, 0.950927734375, 1.0003662109375, 1.0498046875, 1.0992431640625, 1.148681640625, 1.1981201171875, 1.24755859375, 1.2969970703125, 1.346435546875, 1.3958740234375, 1.4453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 15.0, 14.0, 17.0, 26.0, 24.0, 63.0, 101.0, 121.0, 265.0, 442.0, 686.0, 775.0, 589.0, 305.0, 191.0, 139.0, 74.0, 34.0, 38.0, 43.0, 31.0, 18.0, 10.0, 10.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.8517913818359375, -1.790496826171875, -1.7292022705078125, -1.66790771484375, -1.6066131591796875, -1.545318603515625, -1.4840240478515625, -1.4227294921875, -1.3614349365234375, -1.300140380859375, -1.2388458251953125, -1.17755126953125, -1.1162567138671875, -1.054962158203125, -0.9936676025390625, -0.932373046875, -0.8710784912109375, -0.809783935546875, -0.7484893798828125, -0.68719482421875, -0.6259002685546875, -0.564605712890625, -0.5033111572265625, -0.4420166015625, -0.3807220458984375, -0.319427490234375, -0.2581329345703125, -0.19683837890625, -0.1355438232421875, -0.074249267578125, -0.0129547119140625, 0.04833984375, 0.1096343994140625, 0.170928955078125, 0.2322235107421875, 0.29351806640625, 0.3548126220703125, 0.416107177734375, 0.4774017333984375, 0.5386962890625, 0.5999908447265625, 0.661285400390625, 0.7225799560546875, 0.78387451171875, 0.8451690673828125, 0.906463623046875, 0.9677581787109375, 1.029052734375, 1.0903472900390625, 1.151641845703125, 1.2129364013671875, 1.27423095703125, 1.3355255126953125, 1.396820068359375, 1.4581146240234375, 1.5194091796875, 1.5807037353515625, 1.641998291015625, 1.7032928466796875, 1.76458740234375, 1.8258819580078125, 1.887176513671875, 1.9484710693359375, 2.009765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 31.0, 217.0, 438.0, 233.0, 53.0, 10.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.59027099609375, -34.2432746887207, -32.896278381347656, -31.549283981323242, -30.202289581298828, -28.85529327392578, -27.508296966552734, -26.16130256652832, -24.814308166503906, -23.46731185913086, -22.120317459106445, -20.7733211517334, -19.426326751708984, -18.079330444335938, -16.73233413696289, -15.385339736938477, -14.03834342956543, -12.6913480758667, -11.344352722167969, -9.997356414794922, -8.650362014770508, -7.303366184234619, -5.9563703536987305, -4.609375, -3.2623796463012695, -1.9153841733932495, -0.5683887004852295, 0.7786068916320801, 2.1256022453308105, 3.472597599029541, 4.81959342956543, 6.16658878326416, 7.513584136962891, 8.860579490661621, 10.207574844360352, 11.554571151733398, 12.901565551757812, 14.24856185913086, 15.59555721282959, 16.94255256652832, 18.289546966552734, 19.63654327392578, 20.983537673950195, 22.330533981323242, 23.677528381347656, 25.024524688720703, 26.37152099609375, 27.718515396118164, 29.06551170349121, 30.412508010864258, 31.759502410888672, 33.10649871826172, 34.453495025634766, 35.80048751831055, 37.147483825683594, 38.49448013305664, 39.84147644042969, 41.188472747802734, 42.53546905517578, 43.88246154785156, 45.22945785522461, 46.576454162597656, 47.9234504699707, 49.27044677734375, 50.61743927001953]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 11.0, 4.0, 6.0, 9.0, 13.0, 12.0, 24.0, 30.0, 37.0, 46.0, 53.0, 68.0, 45.0, 62.0, 78.0, 44.0, 65.0, 64.0, 53.0, 38.0, 49.0, 37.0, 36.0, 22.0, 25.0, 27.0, 10.0, 14.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546370506286621, -11.097363471984863, -10.648356437683105, -10.199349403381348, -9.750341415405273, -9.301334381103516, -8.852327346801758, -8.4033203125, -7.954313278198242, -7.505306243896484, -7.056299209594727, -6.6072916984558105, -6.158284664154053, -5.709277629852295, -5.260270118713379, -4.811263084411621, -4.362256050109863, -3.9132490158081055, -3.4642417430877686, -3.0152344703674316, -2.566227436065674, -2.117220401763916, -1.668213129043579, -1.2192058563232422, -0.7701988220214844, -0.321191668510437, 0.12781548500061035, 0.5768226385116577, 1.025829792022705, 1.474836826324463, 1.9238440990447998, 2.3728513717651367, 2.821859359741211, 3.2708663940429688, 3.7198736667633057, 4.168880939483643, 4.6178879737854, 5.066895008087158, 5.515902519226074, 5.964909553527832, 6.41391658782959, 6.862923622131348, 7.3119306564331055, 7.7609381675720215, 8.209945678710938, 8.658952713012695, 9.107959747314453, 9.556966781616211, 10.005973815917969, 10.454980850219727, 10.903987884521484, 11.352994918823242, 11.802001953125, 12.251008987426758, 12.700016975402832, 13.14902400970459, 13.598031044006348, 14.047038078308105, 14.496045112609863, 14.945052146911621, 15.394060134887695, 15.843067169189453, 16.29207420349121, 16.74108123779297, 17.190088272094727]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 21.0, 29.0, 35.0, 68.0, 127.0, 203.0, 416.0, 675.0, 1341.0, 2549.0, 5086.0, 10830.0, 24784.0, 56589.0, 131326.0, 269742.0, 285153.0, 145975.0, 63145.0, 26937.0, 12056.0, 5513.0, 2769.0, 1354.0, 811.0, 437.0, 221.0, 142.0, 74.0, 49.0, 40.0, 10.0, 7.0, 9.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0368804931640625, -0.998565673828125, -0.9602508544921875, -0.92193603515625, -0.8836212158203125, -0.845306396484375, -0.8069915771484375, -0.7686767578125, -0.7303619384765625, -0.692047119140625, -0.6537322998046875, -0.61541748046875, -0.5771026611328125, -0.538787841796875, -0.5004730224609375, -0.462158203125, -0.4238433837890625, -0.385528564453125, -0.3472137451171875, -0.30889892578125, -0.2705841064453125, -0.232269287109375, -0.1939544677734375, -0.1556396484375, -0.1173248291015625, -0.079010009765625, -0.0406951904296875, -0.00238037109375, 0.0359344482421875, 0.074249267578125, 0.1125640869140625, 0.15087890625, 0.1891937255859375, 0.227508544921875, 0.2658233642578125, 0.30413818359375, 0.3424530029296875, 0.380767822265625, 0.4190826416015625, 0.4573974609375, 0.4957122802734375, 0.534027099609375, 0.5723419189453125, 0.61065673828125, 0.6489715576171875, 0.687286376953125, 0.7256011962890625, 0.763916015625, 0.8022308349609375, 0.840545654296875, 0.8788604736328125, 0.91717529296875, 0.9554901123046875, 0.993804931640625, 1.0321197509765625, 1.0704345703125, 1.1087493896484375, 1.147064208984375, 1.1853790283203125, 1.22369384765625, 1.2620086669921875, 1.300323486328125, 1.3386383056640625, 1.376953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 10.0, 14.0, 14.0, 18.0, 22.0, 27.0, 36.0, 43.0, 53.0, 46.0, 60.0, 56.0, 70.0, 45.0, 56.0, 55.0, 50.0, 60.0, 38.0, 41.0, 22.0, 33.0, 29.0, 19.0, 18.0, 7.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0156402587890625, -0.985382080078125, -0.9551239013671875, -0.92486572265625, -0.8946075439453125, -0.864349365234375, -0.8340911865234375, -0.8038330078125, -0.7735748291015625, -0.743316650390625, -0.7130584716796875, -0.68280029296875, -0.6525421142578125, -0.622283935546875, -0.5920257568359375, -0.561767578125, -0.5315093994140625, -0.501251220703125, -0.4709930419921875, -0.44073486328125, -0.4104766845703125, -0.380218505859375, -0.3499603271484375, -0.3197021484375, -0.2894439697265625, -0.259185791015625, -0.2289276123046875, -0.19866943359375, -0.1684112548828125, -0.138153076171875, -0.1078948974609375, -0.07763671875, -0.0473785400390625, -0.017120361328125, 0.0131378173828125, 0.04339599609375, 0.0736541748046875, 0.103912353515625, 0.1341705322265625, 0.1644287109375, 0.1946868896484375, 0.224945068359375, 0.2552032470703125, 0.28546142578125, 0.3157196044921875, 0.345977783203125, 0.3762359619140625, 0.406494140625, 0.4367523193359375, 0.467010498046875, 0.4972686767578125, 0.52752685546875, 0.5577850341796875, 0.588043212890625, 0.6183013916015625, 0.6485595703125, 0.6788177490234375, 0.709075927734375, 0.7393341064453125, 0.76959228515625, 0.7998504638671875, 0.830108642578125, 0.8603668212890625, 0.890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 12.0, 16.0, 22.0, 35.0, 34.0, 60.0, 70.0, 105.0, 157.0, 208.0, 330.0, 503.0, 932.0, 1827.0, 4932.0, 21657.0, 181740.0, 717725.0, 97391.0, 13417.0, 3601.0, 1528.0, 786.0, 457.0, 301.0, 196.0, 137.0, 105.0, 65.0, 44.0, 35.0, 34.0, 29.0, 9.0, 12.0, 6.0, 10.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5, -2.40863037109375, -2.3172607421875, -2.22589111328125, -2.134521484375, -2.04315185546875, -1.9517822265625, -1.86041259765625, -1.76904296875, -1.67767333984375, -1.5863037109375, -1.49493408203125, -1.403564453125, -1.31219482421875, -1.2208251953125, -1.12945556640625, -1.0380859375, -0.94671630859375, -0.8553466796875, -0.76397705078125, -0.672607421875, -0.58123779296875, -0.4898681640625, -0.39849853515625, -0.30712890625, -0.21575927734375, -0.1243896484375, -0.03302001953125, 0.058349609375, 0.14971923828125, 0.2410888671875, 0.33245849609375, 0.423828125, 0.51519775390625, 0.6065673828125, 0.69793701171875, 0.789306640625, 0.88067626953125, 0.9720458984375, 1.06341552734375, 1.15478515625, 1.24615478515625, 1.3375244140625, 1.42889404296875, 1.520263671875, 1.61163330078125, 1.7030029296875, 1.79437255859375, 1.8857421875, 1.97711181640625, 2.0684814453125, 2.15985107421875, 2.251220703125, 2.34259033203125, 2.4339599609375, 2.52532958984375, 2.61669921875, 2.70806884765625, 2.7994384765625, 2.89080810546875, 2.982177734375, 3.07354736328125, 3.1649169921875, 3.25628662109375, 3.34765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 15.0, 18.0, 17.0, 24.0, 14.0, 21.0, 35.0, 24.0, 33.0, 37.0, 44.0, 38.0, 49.0, 55.0, 59.0, 41.0, 55.0, 54.0, 44.0, 43.0, 41.0, 35.0, 34.0, 31.0, 16.0, 19.0, 21.0, 16.0, 8.0, 8.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.828399658203125, -2.72711181640625, -2.625823974609375, -2.5245361328125, -2.423248291015625, -2.32196044921875, -2.220672607421875, -2.119384765625, -2.018096923828125, -1.91680908203125, -1.815521240234375, -1.7142333984375, -1.612945556640625, -1.51165771484375, -1.410369873046875, -1.30908203125, -1.207794189453125, -1.10650634765625, -1.005218505859375, -0.9039306640625, -0.802642822265625, -0.70135498046875, -0.600067138671875, -0.498779296875, -0.397491455078125, -0.29620361328125, -0.194915771484375, -0.0936279296875, 0.007659912109375, 0.10894775390625, 0.210235595703125, 0.3115234375, 0.412811279296875, 0.51409912109375, 0.615386962890625, 0.7166748046875, 0.817962646484375, 0.91925048828125, 1.020538330078125, 1.121826171875, 1.223114013671875, 1.32440185546875, 1.425689697265625, 1.5269775390625, 1.628265380859375, 1.72955322265625, 1.830841064453125, 1.93212890625, 2.033416748046875, 2.13470458984375, 2.235992431640625, 2.3372802734375, 2.438568115234375, 2.53985595703125, 2.641143798828125, 2.742431640625, 2.843719482421875, 2.94500732421875, 3.046295166015625, 3.1475830078125, 3.248870849609375, 3.35015869140625, 3.451446533203125, 3.552734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 6.0, 16.0, 17.0, 32.0, 36.0, 84.0, 135.0, 308.0, 809.0, 2632.0, 13474.0, 122817.0, 780671.0, 110924.0, 12663.0, 2516.0, 748.0, 330.0, 127.0, 84.0, 40.0, 19.0, 21.0, 18.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.989013671875, -0.95947265625, -0.929931640625, -0.900390625, -0.870849609375, -0.84130859375, -0.811767578125, -0.7822265625, -0.752685546875, -0.72314453125, -0.693603515625, -0.6640625, -0.634521484375, -0.60498046875, -0.575439453125, -0.5458984375, -0.516357421875, -0.48681640625, -0.457275390625, -0.427734375, -0.398193359375, -0.36865234375, -0.339111328125, -0.3095703125, -0.280029296875, -0.25048828125, -0.220947265625, -0.19140625, -0.161865234375, -0.13232421875, -0.102783203125, -0.0732421875, -0.043701171875, -0.01416015625, 0.015380859375, 0.044921875, 0.074462890625, 0.10400390625, 0.133544921875, 0.1630859375, 0.192626953125, 0.22216796875, 0.251708984375, 0.28125, 0.310791015625, 0.34033203125, 0.369873046875, 0.3994140625, 0.428955078125, 0.45849609375, 0.488037109375, 0.517578125, 0.547119140625, 0.57666015625, 0.606201171875, 0.6357421875, 0.665283203125, 0.69482421875, 0.724365234375, 0.75390625, 0.783447265625, 0.81298828125, 0.842529296875, 0.8720703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 10.0, 9.0, 11.0, 8.0, 19.0, 31.0, 32.0, 35.0, 69.0, 98.0, 117.0, 120.0, 114.0, 86.0, 87.0, 44.0, 29.0, 25.0, 13.0, 12.0, 9.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021505355834960938, -0.0002069510519504547, -0.00019884854555130005, -0.00019074603915214539, -0.00018264353275299072, -0.00017454102635383606, -0.0001664385199546814, -0.00015833601355552673, -0.00015023350715637207, -0.0001421310007572174, -0.00013402849435806274, -0.00012592598795890808, -0.00011782348155975342, -0.00010972097516059875, -0.00010161846876144409, -9.351596236228943e-05, -8.541345596313477e-05, -7.73109495639801e-05, -6.920844316482544e-05, -6.110593676567078e-05, -5.300343036651611e-05, -4.490092396736145e-05, -3.679841756820679e-05, -2.8695911169052124e-05, -2.059340476989746e-05, -1.2490898370742798e-05, -4.388391971588135e-06, 3.7141144275665283e-06, 1.1816620826721191e-05, 1.9919127225875854e-05, 2.8021633625030518e-05, 3.612414002418518e-05, 4.4226646423339844e-05, 5.232915282249451e-05, 6.043165922164917e-05, 6.853416562080383e-05, 7.66366720199585e-05, 8.473917841911316e-05, 9.284168481826782e-05, 0.00010094419121742249, 0.00010904669761657715, 0.00011714920401573181, 0.00012525171041488647, 0.00013335421681404114, 0.0001414567232131958, 0.00014955922961235046, 0.00015766173601150513, 0.0001657642424106598, 0.00017386674880981445, 0.00018196925520896912, 0.00019007176160812378, 0.00019817426800727844, 0.0002062767744064331, 0.00021437928080558777, 0.00022248178720474243, 0.0002305842936038971, 0.00023868680000305176, 0.0002467893064022064, 0.0002548918128013611, 0.00026299431920051575, 0.0002710968255996704, 0.0002791993319988251, 0.00028730183839797974, 0.0002954043447971344, 0.00030350685119628906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 8.0, 10.0, 14.0, 20.0, 23.0, 48.0, 81.0, 162.0, 325.0, 645.0, 1574.0, 5123.0, 28776.0, 324271.0, 632019.0, 45118.0, 6863.0, 1929.0, 775.0, 356.0, 193.0, 81.0, 62.0, 33.0, 15.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73046875, -0.7035140991210938, -0.6765594482421875, -0.6496047973632812, -0.622650146484375, -0.5956954956054688, -0.5687408447265625, -0.5417861938476562, -0.51483154296875, -0.48787689208984375, -0.4609222412109375, -0.43396759033203125, -0.407012939453125, -0.38005828857421875, -0.3531036376953125, -0.32614898681640625, -0.2991943359375, -0.27223968505859375, -0.2452850341796875, -0.21833038330078125, -0.191375732421875, -0.16442108154296875, -0.1374664306640625, -0.11051177978515625, -0.08355712890625, -0.05660247802734375, -0.0296478271484375, -0.00269317626953125, 0.024261474609375, 0.05121612548828125, 0.0781707763671875, 0.10512542724609375, 0.132080078125, 0.15903472900390625, 0.1859893798828125, 0.21294403076171875, 0.239898681640625, 0.26685333251953125, 0.2938079833984375, 0.32076263427734375, 0.34771728515625, 0.37467193603515625, 0.4016265869140625, 0.42858123779296875, 0.455535888671875, 0.48249053955078125, 0.5094451904296875, 0.5363998413085938, 0.5633544921875, 0.5903091430664062, 0.6172637939453125, 0.6442184448242188, 0.671173095703125, 0.6981277465820312, 0.7250823974609375, 0.7520370483398438, 0.77899169921875, 0.8059463500976562, 0.8329010009765625, 0.8598556518554688, 0.886810302734375, 0.9137649536132812, 0.9407196044921875, 0.9676742553710938, 0.99462890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 21.0, 30.0, 34.0, 37.0, 52.0, 56.0, 80.0, 91.0, 87.0, 91.0, 93.0, 77.0, 56.0, 57.0, 43.0, 18.0, 17.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.40940093994140625, -0.3847198486328125, -0.36003875732421875, -0.335357666015625, -0.31067657470703125, -0.2859954833984375, -0.26131439208984375, -0.23663330078125, -0.21195220947265625, -0.1872711181640625, -0.16259002685546875, -0.137908935546875, -0.11322784423828125, -0.0885467529296875, -0.06386566162109375, -0.0391845703125, -0.01450347900390625, 0.0101776123046875, 0.03485870361328125, 0.059539794921875, 0.08422088623046875, 0.1089019775390625, 0.13358306884765625, 0.15826416015625, 0.18294525146484375, 0.2076263427734375, 0.23230743408203125, 0.256988525390625, 0.28166961669921875, 0.3063507080078125, 0.33103179931640625, 0.355712890625, 0.38039398193359375, 0.4050750732421875, 0.42975616455078125, 0.454437255859375, 0.47911834716796875, 0.5037994384765625, 0.5284805297851562, 0.55316162109375, 0.5778427124023438, 0.6025238037109375, 0.6272048950195312, 0.651885986328125, 0.6765670776367188, 0.7012481689453125, 0.7259292602539062, 0.7506103515625, 0.7752914428710938, 0.7999725341796875, 0.8246536254882812, 0.849334716796875, 0.8740158081054688, 0.8986968994140625, 0.9233779907226562, 0.94805908203125, 0.9727401733398438, 0.9974212646484375, 1.0221023559570312, 1.046783447265625, 1.0714645385742188, 1.0961456298828125, 1.1208267211914062, 1.1455078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 13.0, 21.0, 43.0, 82.0, 117.0, 259.0, 204.0, 113.0, 63.0, 33.0, 13.0, 15.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.277312278747559, -12.66807746887207, -12.058841705322266, -11.449606895446777, -10.840372085571289, -10.231136322021484, -9.621901512145996, -9.012666702270508, -8.403430938720703, -7.794195652008057, -7.18496036529541, -6.575725555419922, -5.966490268707275, -5.357254981994629, -4.748020172119141, -4.138784885406494, -3.5295495986938477, -2.920314311981201, -2.311079263687134, -1.7018440961837769, -1.09260892868042, -0.48337364196777344, 0.12586140632629395, 0.7350964546203613, 1.3443317413330078, 1.9535669088363647, 2.5628020763397217, 3.172037124633789, 3.7812724113464355, 4.390507698059082, 4.99974250793457, 5.608977794647217, 6.21821403503418, 6.827449321746826, 7.436684608459473, 8.045919418334961, 8.655155181884766, 9.264389991760254, 9.873624801635742, 10.482860565185547, 11.092095375061035, 11.701330184936523, 12.310565948486328, 12.919800758361816, 13.529035568237305, 14.13827133178711, 14.747506141662598, 15.356740951538086, 15.96597671508789, 16.575212478637695, 17.184446334838867, 17.793682098388672, 18.402917861938477, 19.01215362548828, 19.621387481689453, 20.230623245239258, 20.839859008789062, 21.449094772338867, 22.05832862854004, 22.667564392089844, 23.27680015563965, 23.886035919189453, 24.495269775390625, 25.10450553894043, 25.7137393951416]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 9.0, 12.0, 18.0, 10.0, 10.0, 13.0, 22.0, 26.0, 29.0, 41.0, 34.0, 29.0, 34.0, 71.0, 79.0, 85.0, 70.0, 55.0, 44.0, 37.0, 36.0, 33.0, 28.0, 26.0, 13.0, 22.0, 17.0, 9.0, 11.0, 11.0, 5.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.883549690246582, -13.452656745910645, -13.02176284790039, -12.590869903564453, -12.159976959228516, -11.729084014892578, -11.29819107055664, -10.867297172546387, -10.43640422821045, -10.005511283874512, -9.574617385864258, -9.14372444152832, -8.712831497192383, -8.281938552856445, -7.85104513168335, -7.420151710510254, -6.989258766174316, -6.558365821838379, -6.127472400665283, -5.6965789794921875, -5.26568603515625, -4.8347930908203125, -4.403899669647217, -3.9730064868927, -3.5421133041381836, -3.111220121383667, -2.6803269386291504, -2.249433755874634, -1.8185405731201172, -1.3876473903656006, -0.956754207611084, -0.5258610248565674, -0.09496688842773438, 0.3359262943267822, 0.7668194770812988, 1.1977126598358154, 1.628605842590332, 2.0594990253448486, 2.4903922080993652, 2.921285390853882, 3.3521785736083984, 3.783071756362915, 4.213964939117432, 4.644858360290527, 5.075751304626465, 5.506644248962402, 5.937537670135498, 6.368431091308594, 6.799324035644531, 7.230216979980469, 7.6611104011535645, 8.09200382232666, 8.522896766662598, 8.953789710998535, 9.384683609008789, 9.815576553344727, 10.246469497680664, 10.677362442016602, 11.108255386352539, 11.539149284362793, 11.97004222869873, 12.400935173034668, 12.831829071044922, 13.26272201538086, 13.693614959716797]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 14.0, 13.0, 19.0, 43.0, 58.0, 95.0, 187.0, 385.0, 889.0, 2632.0, 9492.0, 55217.0, 630481.0, 2895416.0, 534025.0, 51102.0, 9878.0, 2646.0, 893.0, 378.0, 179.0, 81.0, 50.0, 39.0, 21.0, 18.0, 9.0, 6.0, 1.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.3904876708984375, -1.351287841796875, -1.3120880126953125, -1.27288818359375, -1.2336883544921875, -1.194488525390625, -1.1552886962890625, -1.1160888671875, -1.0768890380859375, -1.037689208984375, -0.9984893798828125, -0.95928955078125, -0.9200897216796875, -0.880889892578125, -0.8416900634765625, -0.802490234375, -0.7632904052734375, -0.724090576171875, -0.6848907470703125, -0.64569091796875, -0.6064910888671875, -0.567291259765625, -0.5280914306640625, -0.4888916015625, -0.4496917724609375, -0.410491943359375, -0.3712921142578125, -0.33209228515625, -0.2928924560546875, -0.253692626953125, -0.2144927978515625, -0.17529296875, -0.1360931396484375, -0.096893310546875, -0.0576934814453125, -0.01849365234375, 0.0207061767578125, 0.059906005859375, 0.0991058349609375, 0.1383056640625, 0.1775054931640625, 0.216705322265625, 0.2559051513671875, 0.29510498046875, 0.3343048095703125, 0.373504638671875, 0.4127044677734375, 0.451904296875, 0.4911041259765625, 0.530303955078125, 0.5695037841796875, 0.60870361328125, 0.6479034423828125, 0.687103271484375, 0.7263031005859375, 0.7655029296875, 0.8047027587890625, 0.843902587890625, 0.8831024169921875, 0.92230224609375, 0.9615020751953125, 1.000701904296875, 1.0399017333984375, 1.0791015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 20.0, 15.0, 30.0, 31.0, 36.0, 43.0, 44.0, 66.0, 51.0, 71.0, 58.0, 55.0, 52.0, 61.0, 46.0, 40.0, 38.0, 42.0, 41.0, 24.0, 33.0, 13.0, 14.0, 12.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.06640625, -1.0360107421875, -1.005615234375, -0.9752197265625, -0.94482421875, -0.9144287109375, -0.884033203125, -0.8536376953125, -0.8232421875, -0.7928466796875, -0.762451171875, -0.7320556640625, -0.70166015625, -0.6712646484375, -0.640869140625, -0.6104736328125, -0.580078125, -0.5496826171875, -0.519287109375, -0.4888916015625, -0.45849609375, -0.4281005859375, -0.397705078125, -0.3673095703125, -0.3369140625, -0.3065185546875, -0.276123046875, -0.2457275390625, -0.21533203125, -0.1849365234375, -0.154541015625, -0.1241455078125, -0.09375, -0.0633544921875, -0.032958984375, -0.0025634765625, 0.02783203125, 0.0582275390625, 0.088623046875, 0.1190185546875, 0.1494140625, 0.1798095703125, 0.210205078125, 0.2406005859375, 0.27099609375, 0.3013916015625, 0.331787109375, 0.3621826171875, 0.392578125, 0.4229736328125, 0.453369140625, 0.4837646484375, 0.51416015625, 0.5445556640625, 0.574951171875, 0.6053466796875, 0.6357421875, 0.6661376953125, 0.696533203125, 0.7269287109375, 0.75732421875, 0.7877197265625, 0.818115234375, 0.8485107421875, 0.87890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 3.0, 12.0, 15.0, 29.0, 37.0, 47.0, 102.0, 165.0, 246.0, 542.0, 1134.0, 2808.0, 9240.0, 43062.0, 521962.0, 3370967.0, 208960.0, 25516.0, 5862.0, 1859.0, 808.0, 377.0, 202.0, 112.0, 63.0, 41.0, 29.0, 16.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003265380859375, -1.549285888671875, -1.4982452392578125, -1.44720458984375, -1.3961639404296875, -1.345123291015625, -1.2940826416015625, -1.2430419921875, -1.1920013427734375, -1.140960693359375, -1.0899200439453125, -1.03887939453125, -0.9878387451171875, -0.936798095703125, -0.8857574462890625, -0.834716796875, -0.7836761474609375, -0.732635498046875, -0.6815948486328125, -0.63055419921875, -0.5795135498046875, -0.528472900390625, -0.4774322509765625, -0.4263916015625, -0.3753509521484375, -0.324310302734375, -0.2732696533203125, -0.22222900390625, -0.1711883544921875, -0.120147705078125, -0.0691070556640625, -0.01806640625, 0.0329742431640625, 0.084014892578125, 0.1350555419921875, 0.18609619140625, 0.2371368408203125, 0.288177490234375, 0.3392181396484375, 0.3902587890625, 0.4412994384765625, 0.492340087890625, 0.5433807373046875, 0.59442138671875, 0.6454620361328125, 0.696502685546875, 0.7475433349609375, 0.798583984375, 0.8496246337890625, 0.900665283203125, 0.9517059326171875, 1.00274658203125, 1.0537872314453125, 1.104827880859375, 1.1558685302734375, 1.2069091796875, 1.2579498291015625, 1.308990478515625, 1.3600311279296875, 1.41107177734375, 1.4621124267578125, 1.513153076171875, 1.5641937255859375, 1.615234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 10.0, 23.0, 24.0, 29.0, 46.0, 64.0, 117.0, 198.0, 271.0, 442.0, 570.0, 631.0, 502.0, 385.0, 247.0, 155.0, 90.0, 54.0, 44.0, 34.0, 17.0, 14.0, 14.0, 9.0, 6.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.2996063232421875, -1.253509521484375, -1.2074127197265625, -1.16131591796875, -1.1152191162109375, -1.069122314453125, -1.0230255126953125, -0.9769287109375, -0.9308319091796875, -0.884735107421875, -0.8386383056640625, -0.79254150390625, -0.7464447021484375, -0.700347900390625, -0.6542510986328125, -0.608154296875, -0.5620574951171875, -0.515960693359375, -0.4698638916015625, -0.42376708984375, -0.3776702880859375, -0.331573486328125, -0.2854766845703125, -0.2393798828125, -0.1932830810546875, -0.147186279296875, -0.1010894775390625, -0.05499267578125, -0.0088958740234375, 0.037200927734375, 0.0832977294921875, 0.12939453125, 0.1754913330078125, 0.221588134765625, 0.2676849365234375, 0.31378173828125, 0.3598785400390625, 0.405975341796875, 0.4520721435546875, 0.4981689453125, 0.5442657470703125, 0.590362548828125, 0.6364593505859375, 0.68255615234375, 0.7286529541015625, 0.774749755859375, 0.8208465576171875, 0.866943359375, 0.9130401611328125, 0.959136962890625, 1.0052337646484375, 1.05133056640625, 1.0974273681640625, 1.143524169921875, 1.1896209716796875, 1.2357177734375, 1.2818145751953125, 1.327911376953125, 1.3740081787109375, 1.42010498046875, 1.4662017822265625, 1.512298583984375, 1.5583953857421875, 1.6044921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 23.0, 61.0, 427.0, 396.0, 64.0, 16.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.95310592651367, -48.634666442871094, -47.31623077392578, -45.9977912902832, -44.679351806640625, -43.36091613769531, -42.042476654052734, -40.724037170410156, -39.405601501464844, -38.087162017822266, -36.76872634887695, -35.450286865234375, -34.13185119628906, -32.813411712646484, -31.494972229003906, -30.17653465270996, -28.858097076416016, -27.53965950012207, -26.221221923828125, -24.902782440185547, -23.5843448638916, -22.265907287597656, -20.947467803955078, -19.629030227661133, -18.310592651367188, -16.992155075073242, -15.67371654510498, -14.355278015136719, -13.036840438842773, -11.718402862548828, -10.399964332580566, -9.081525802612305, -7.763092041015625, -6.4446539878845215, -5.126215934753418, -3.8077778816223145, -2.489339828491211, -1.1709017753601074, 0.1475362777709961, 1.4659748077392578, 2.784412384033203, 4.102850437164307, 5.42128849029541, 6.739726543426514, 8.058164596557617, 9.376602172851562, 10.695040702819824, 12.013479232788086, 13.331916809082031, 14.650354385375977, 15.968792915344238, 17.2872314453125, 18.605669021606445, 19.92410659790039, 21.24254608154297, 22.560983657836914, 23.87942123413086, 25.197858810424805, 26.51629638671875, 27.834735870361328, 29.153173446655273, 30.47161102294922, 31.790050506591797, 33.108489990234375, 34.42692565917969]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 14.0, 13.0, 9.0, 16.0, 27.0, 17.0, 18.0, 36.0, 28.0, 44.0, 52.0, 58.0, 48.0, 59.0, 60.0, 60.0, 44.0, 57.0, 36.0, 53.0, 31.0, 35.0, 32.0, 32.0, 22.0, 23.0, 16.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.923690795898438, -10.651545524597168, -10.379400253295898, -10.107254981994629, -9.83510971069336, -9.56296443939209, -9.29081916809082, -9.018672943115234, -8.746528625488281, -8.474383354187012, -8.202238082885742, -7.930092811584473, -7.657947540283203, -7.385802268981934, -7.113656520843506, -6.841511249542236, -6.569365501403809, -6.297220230102539, -6.0250749588012695, -5.7529296875, -5.4807844161987305, -5.208639144897461, -4.936493396759033, -4.664348125457764, -4.392202854156494, -4.120057582855225, -3.847912311553955, -3.5757668018341064, -3.303621530532837, -3.0314762592315674, -2.7593307495117188, -2.487185478210449, -2.215041160583496, -1.9428958892822266, -1.6707504987716675, -1.3986051082611084, -1.1264598369598389, -0.8543145656585693, -0.5821691751480103, -0.31002378463745117, -0.03787851333618164, 0.23426681756973267, 0.506412148475647, 0.7785574793815613, 1.0507028102874756, 1.3228480815887451, 1.5949934720993042, 1.8671388626098633, 2.139284133911133, 2.4114294052124023, 2.683574676513672, 2.9557201862335205, 3.22786545753479, 3.5000107288360596, 3.772156238555908, 4.044301509857178, 4.316446781158447, 4.588592052459717, 4.860737323760986, 5.132882595062256, 5.405028343200684, 5.677173614501953, 5.949318885803223, 6.221464157104492, 6.493609428405762]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 26.0, 28.0, 49.0, 96.0, 124.0, 209.0, 370.0, 533.0, 935.0, 1696.0, 2816.0, 5194.0, 9801.0, 19132.0, 38872.0, 79475.0, 155023.0, 235557.0, 224028.0, 136496.0, 68695.0, 33501.0, 16688.0, 8562.0, 4529.0, 2497.0, 1395.0, 868.0, 512.0, 299.0, 184.0, 130.0, 82.0, 45.0, 27.0, 23.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8707427978515625, -0.842559814453125, -0.8143768310546875, -0.78619384765625, -0.7580108642578125, -0.729827880859375, -0.7016448974609375, -0.6734619140625, -0.6452789306640625, -0.617095947265625, -0.5889129638671875, -0.56072998046875, -0.5325469970703125, -0.504364013671875, -0.4761810302734375, -0.447998046875, -0.4198150634765625, -0.391632080078125, -0.3634490966796875, -0.33526611328125, -0.3070831298828125, -0.278900146484375, -0.2507171630859375, -0.2225341796875, -0.1943511962890625, -0.166168212890625, -0.1379852294921875, -0.10980224609375, -0.0816192626953125, -0.053436279296875, -0.0252532958984375, 0.0029296875, 0.0311126708984375, 0.059295654296875, 0.0874786376953125, 0.11566162109375, 0.1438446044921875, 0.172027587890625, 0.2002105712890625, 0.2283935546875, 0.2565765380859375, 0.284759521484375, 0.3129425048828125, 0.34112548828125, 0.3693084716796875, 0.397491455078125, 0.4256744384765625, 0.453857421875, 0.4820404052734375, 0.510223388671875, 0.5384063720703125, 0.56658935546875, 0.5947723388671875, 0.622955322265625, 0.6511383056640625, 0.6793212890625, 0.7075042724609375, 0.735687255859375, 0.7638702392578125, 0.79205322265625, 0.8202362060546875, 0.848419189453125, 0.8766021728515625, 0.90478515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 10.0, 11.0, 20.0, 23.0, 29.0, 25.0, 36.0, 35.0, 39.0, 63.0, 51.0, 50.0, 62.0, 59.0, 61.0, 55.0, 39.0, 39.0, 49.0, 37.0, 24.0, 28.0, 34.0, 13.0, 20.0, 21.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.013671875, -0.984344482421875, -0.95501708984375, -0.925689697265625, -0.8963623046875, -0.867034912109375, -0.83770751953125, -0.808380126953125, -0.779052734375, -0.749725341796875, -0.72039794921875, -0.691070556640625, -0.6617431640625, -0.632415771484375, -0.60308837890625, -0.573760986328125, -0.54443359375, -0.515106201171875, -0.48577880859375, -0.456451416015625, -0.4271240234375, -0.397796630859375, -0.36846923828125, -0.339141845703125, -0.309814453125, -0.280487060546875, -0.25115966796875, -0.221832275390625, -0.1925048828125, -0.163177490234375, -0.13385009765625, -0.104522705078125, -0.0751953125, -0.045867919921875, -0.01654052734375, 0.012786865234375, 0.0421142578125, 0.071441650390625, 0.10076904296875, 0.130096435546875, 0.159423828125, 0.188751220703125, 0.21807861328125, 0.247406005859375, 0.2767333984375, 0.306060791015625, 0.33538818359375, 0.364715576171875, 0.39404296875, 0.423370361328125, 0.45269775390625, 0.482025146484375, 0.5113525390625, 0.540679931640625, 0.57000732421875, 0.599334716796875, 0.628662109375, 0.657989501953125, 0.68731689453125, 0.716644287109375, 0.7459716796875, 0.775299072265625, 0.80462646484375, 0.833953857421875, 0.86328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 10.0, 9.0, 18.0, 16.0, 39.0, 38.0, 58.0, 75.0, 128.0, 217.0, 428.0, 1083.0, 3454.0, 15112.0, 89748.0, 626788.0, 259822.0, 40284.0, 7592.0, 2001.0, 743.0, 338.0, 184.0, 95.0, 86.0, 57.0, 35.0, 22.0, 15.0, 15.0, 14.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.257110595703125, -2.18609619140625, -2.115081787109375, -2.0440673828125, -1.973052978515625, -1.90203857421875, -1.831024169921875, -1.760009765625, -1.688995361328125, -1.61798095703125, -1.546966552734375, -1.4759521484375, -1.404937744140625, -1.33392333984375, -1.262908935546875, -1.19189453125, -1.120880126953125, -1.04986572265625, -0.978851318359375, -0.9078369140625, -0.836822509765625, -0.76580810546875, -0.694793701171875, -0.623779296875, -0.552764892578125, -0.48175048828125, -0.410736083984375, -0.3397216796875, -0.268707275390625, -0.19769287109375, -0.126678466796875, -0.0556640625, 0.015350341796875, 0.08636474609375, 0.157379150390625, 0.2283935546875, 0.299407958984375, 0.37042236328125, 0.441436767578125, 0.512451171875, 0.583465576171875, 0.65447998046875, 0.725494384765625, 0.7965087890625, 0.867523193359375, 0.93853759765625, 1.009552001953125, 1.08056640625, 1.151580810546875, 1.22259521484375, 1.293609619140625, 1.3646240234375, 1.435638427734375, 1.50665283203125, 1.577667236328125, 1.648681640625, 1.719696044921875, 1.79071044921875, 1.861724853515625, 1.9327392578125, 2.003753662109375, 2.07476806640625, 2.145782470703125, 2.216796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 12.0, 13.0, 18.0, 20.0, 15.0, 25.0, 25.0, 34.0, 41.0, 32.0, 41.0, 55.0, 45.0, 54.0, 52.0, 60.0, 51.0, 49.0, 36.0, 43.0, 35.0, 39.0, 32.0, 19.0, 25.0, 22.0, 21.0, 12.0, 12.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0390625, -2.94879150390625, -2.8585205078125, -2.76824951171875, -2.677978515625, -2.58770751953125, -2.4974365234375, -2.40716552734375, -2.31689453125, -2.22662353515625, -2.1363525390625, -2.04608154296875, -1.955810546875, -1.86553955078125, -1.7752685546875, -1.68499755859375, -1.5947265625, -1.50445556640625, -1.4141845703125, -1.32391357421875, -1.233642578125, -1.14337158203125, -1.0531005859375, -0.96282958984375, -0.87255859375, -0.78228759765625, -0.6920166015625, -0.60174560546875, -0.511474609375, -0.42120361328125, -0.3309326171875, -0.24066162109375, -0.150390625, -0.06011962890625, 0.0301513671875, 0.12042236328125, 0.210693359375, 0.30096435546875, 0.3912353515625, 0.48150634765625, 0.57177734375, 0.66204833984375, 0.7523193359375, 0.84259033203125, 0.932861328125, 1.02313232421875, 1.1134033203125, 1.20367431640625, 1.2939453125, 1.38421630859375, 1.4744873046875, 1.56475830078125, 1.655029296875, 1.74530029296875, 1.8355712890625, 1.92584228515625, 2.01611328125, 2.10638427734375, 2.1966552734375, 2.28692626953125, 2.377197265625, 2.46746826171875, 2.5577392578125, 2.64801025390625, 2.73828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 12.0, 23.0, 27.0, 33.0, 59.0, 115.0, 185.0, 365.0, 913.0, 2413.0, 7340.0, 27607.0, 130535.0, 620114.0, 201151.0, 42087.0, 10268.0, 3163.0, 1094.0, 495.0, 226.0, 120.0, 60.0, 44.0, 31.0, 15.0, 15.0, 4.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.557098388671875, -0.53948974609375, -0.521881103515625, -0.5042724609375, -0.486663818359375, -0.46905517578125, -0.451446533203125, -0.433837890625, -0.416229248046875, -0.39862060546875, -0.381011962890625, -0.3634033203125, -0.345794677734375, -0.32818603515625, -0.310577392578125, -0.29296875, -0.275360107421875, -0.25775146484375, -0.240142822265625, -0.2225341796875, -0.204925537109375, -0.18731689453125, -0.169708251953125, -0.152099609375, -0.134490966796875, -0.11688232421875, -0.099273681640625, -0.0816650390625, -0.064056396484375, -0.04644775390625, -0.028839111328125, -0.01123046875, 0.006378173828125, 0.02398681640625, 0.041595458984375, 0.0592041015625, 0.076812744140625, 0.09442138671875, 0.112030029296875, 0.129638671875, 0.147247314453125, 0.16485595703125, 0.182464599609375, 0.2000732421875, 0.217681884765625, 0.23529052734375, 0.252899169921875, 0.2705078125, 0.288116455078125, 0.30572509765625, 0.323333740234375, 0.3409423828125, 0.358551025390625, 0.37615966796875, 0.393768310546875, 0.411376953125, 0.428985595703125, 0.44659423828125, 0.464202880859375, 0.4818115234375, 0.499420166015625, 0.51702880859375, 0.534637451171875, 0.55224609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 10.0, 10.0, 10.0, 11.0, 23.0, 31.0, 35.0, 50.0, 65.0, 61.0, 82.0, 81.0, 95.0, 94.0, 78.0, 52.0, 42.0, 31.0, 24.0, 24.0, 20.0, 13.0, 10.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017845630645751953, -0.0001732315868139267, -0.00016800686717033386, -0.00016278214752674103, -0.0001575574278831482, -0.00015233270823955536, -0.00014710798859596252, -0.0001418832689523697, -0.00013665854930877686, -0.00013143382966518402, -0.0001262091100215912, -0.00012098439037799835, -0.00011575967073440552, -0.00011053495109081268, -0.00010531023144721985, -0.00010008551180362701, -9.486079216003418e-05, -8.963607251644135e-05, -8.441135287284851e-05, -7.918663322925568e-05, -7.396191358566284e-05, -6.873719394207001e-05, -6.351247429847717e-05, -5.828775465488434e-05, -5.3063035011291504e-05, -4.783831536769867e-05, -4.2613595724105835e-05, -3.7388876080513e-05, -3.2164156436920166e-05, -2.693943679332733e-05, -2.1714717149734497e-05, -1.6489997506141663e-05, -1.1265277862548828e-05, -6.040558218955994e-06, -8.158385753631592e-07, 4.408881068229675e-06, 9.63360071182251e-06, 1.4858320355415344e-05, 2.008303999900818e-05, 2.5307759642601013e-05, 3.053247928619385e-05, 3.575719892978668e-05, 4.0981918573379517e-05, 4.620663821697235e-05, 5.1431357860565186e-05, 5.665607750415802e-05, 6.188079714775085e-05, 6.710551679134369e-05, 7.233023643493652e-05, 7.755495607852936e-05, 8.277967572212219e-05, 8.800439536571503e-05, 9.322911500930786e-05, 9.84538346529007e-05, 0.00010367855429649353, 0.00010890327394008636, 0.0001141279935836792, 0.00011935271322727203, 0.00012457743287086487, 0.0001298021525144577, 0.00013502687215805054, 0.00014025159180164337, 0.0001454763114452362, 0.00015070103108882904, 0.00015592575073242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 17.0, 25.0, 15.0, 63.0, 104.0, 184.0, 418.0, 1155.0, 3856.0, 19141.0, 149111.0, 718847.0, 132845.0, 17342.0, 3495.0, 1074.0, 408.0, 201.0, 74.0, 62.0, 30.0, 23.0, 15.0, 10.0, 6.0, 10.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5849838256835938, -0.5610809326171875, -0.5371780395507812, -0.513275146484375, -0.48937225341796875, -0.4654693603515625, -0.44156646728515625, -0.41766357421875, -0.39376068115234375, -0.3698577880859375, -0.34595489501953125, -0.322052001953125, -0.29814910888671875, -0.2742462158203125, -0.25034332275390625, -0.2264404296875, -0.20253753662109375, -0.1786346435546875, -0.15473175048828125, -0.130828857421875, -0.10692596435546875, -0.0830230712890625, -0.05912017822265625, -0.03521728515625, -0.01131439208984375, 0.0125885009765625, 0.03649139404296875, 0.060394287109375, 0.08429718017578125, 0.1082000732421875, 0.13210296630859375, 0.156005859375, 0.17990875244140625, 0.2038116455078125, 0.22771453857421875, 0.251617431640625, 0.27552032470703125, 0.2994232177734375, 0.32332611083984375, 0.34722900390625, 0.37113189697265625, 0.3950347900390625, 0.41893768310546875, 0.442840576171875, 0.46674346923828125, 0.4906463623046875, 0.5145492553710938, 0.5384521484375, 0.5623550415039062, 0.5862579345703125, 0.6101608276367188, 0.634063720703125, 0.6579666137695312, 0.6818695068359375, 0.7057723999023438, 0.72967529296875, 0.7535781860351562, 0.7774810791015625, 0.8013839721679688, 0.825286865234375, 0.8491897583007812, 0.8730926513671875, 0.8969955444335938, 0.9208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 12.0, 11.0, 10.0, 12.0, 19.0, 24.0, 23.0, 29.0, 38.0, 57.0, 55.0, 59.0, 71.0, 71.0, 67.0, 82.0, 46.0, 50.0, 62.0, 47.0, 34.0, 17.0, 20.0, 19.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.46233367919921875, -0.4446868896484375, -0.42704010009765625, -0.409393310546875, -0.39174652099609375, -0.3740997314453125, -0.35645294189453125, -0.33880615234375, -0.32115936279296875, -0.3035125732421875, -0.28586578369140625, -0.268218994140625, -0.25057220458984375, -0.2329254150390625, -0.21527862548828125, -0.1976318359375, -0.17998504638671875, -0.1623382568359375, -0.14469146728515625, -0.127044677734375, -0.10939788818359375, -0.0917510986328125, -0.07410430908203125, -0.05645751953125, -0.03881072998046875, -0.0211639404296875, -0.00351715087890625, 0.014129638671875, 0.03177642822265625, 0.0494232177734375, 0.06707000732421875, 0.084716796875, 0.10236358642578125, 0.1200103759765625, 0.13765716552734375, 0.155303955078125, 0.17295074462890625, 0.1905975341796875, 0.20824432373046875, 0.22589111328125, 0.24353790283203125, 0.2611846923828125, 0.27883148193359375, 0.296478271484375, 0.31412506103515625, 0.3317718505859375, 0.34941864013671875, 0.3670654296875, 0.38471221923828125, 0.4023590087890625, 0.42000579833984375, 0.437652587890625, 0.45529937744140625, 0.4729461669921875, 0.49059295654296875, 0.50823974609375, 0.5258865356445312, 0.5435333251953125, 0.5611801147460938, 0.578826904296875, 0.5964736938476562, 0.6141204833984375, 0.6317672729492188, 0.6494140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 4.0, 6.0, 23.0, 29.0, 82.0, 152.0, 238.0, 221.0, 123.0, 57.0, 20.0, 11.0, 5.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.959287643432617, -25.39434242248535, -24.829397201538086, -24.26445198059082, -23.699506759643555, -23.13456153869629, -22.569616317749023, -22.004671096801758, -21.439725875854492, -20.874780654907227, -20.30983543395996, -19.744890213012695, -19.17994499206543, -18.614999771118164, -18.0500545501709, -17.485109329223633, -16.920166015625, -16.355220794677734, -15.790275573730469, -15.225330352783203, -14.660385131835938, -14.095439910888672, -13.530494689941406, -12.96554946899414, -12.400604248046875, -11.83565902709961, -11.270713806152344, -10.705768585205078, -10.140823364257812, -9.575878143310547, -9.010932922363281, -8.445987701416016, -7.881043434143066, -7.316098213195801, -6.751152992248535, -6.1862077713012695, -5.621262550354004, -5.056317329406738, -4.491372585296631, -3.9264273643493652, -3.3614821434020996, -2.796536922454834, -2.2315917015075684, -1.6666467189788818, -1.1017014980316162, -0.5367562770843506, 0.028188705444335938, 0.5931339263916016, 1.1580791473388672, 1.7230243682861328, 2.2879695892333984, 2.852914571762085, 3.4178597927093506, 3.982805013656616, 4.547749996185303, 5.112695217132568, 5.677640438079834, 6.2425856590271, 6.807530879974365, 7.372475624084473, 7.937420845031738, 8.502366065979004, 9.06731128692627, 9.632256507873535, 10.1972017288208]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 7.0, 4.0, 1.0, 5.0, 8.0, 9.0, 17.0, 11.0, 15.0, 19.0, 19.0, 13.0, 30.0, 23.0, 28.0, 35.0, 48.0, 50.0, 68.0, 65.0, 64.0, 65.0, 53.0, 31.0, 33.0, 34.0, 24.0, 31.0, 23.0, 21.0, 17.0, 23.0, 18.0, 16.0, 12.0, 14.0, 6.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.511778831481934, -9.186701774597168, -8.861624717712402, -8.536547660827637, -8.211470603942871, -7.8863935470581055, -7.561316013336182, -7.236238956451416, -6.91116189956665, -6.586084842681885, -6.261007785797119, -5.9359307289123535, -5.61085319519043, -5.285776138305664, -4.960699081420898, -4.635622024536133, -4.310544967651367, -3.9854679107666016, -3.660390853881836, -3.335313558578491, -3.0102365016937256, -2.68515944480896, -2.3600821495056152, -2.0350050926208496, -1.709928035736084, -1.3848509788513184, -1.0597738027572632, -0.7346966862678528, -0.4096195697784424, -0.08454251289367676, 0.24053466320037842, 0.5656118392944336, 0.8906879425048828, 1.2157649993896484, 1.5408421754837036, 1.8659193515777588, 2.1909964084625244, 2.51607346534729, 2.8411507606506348, 3.1662278175354004, 3.491304874420166, 3.8163819313049316, 4.141458988189697, 4.466536045074463, 4.791613578796387, 5.116690635681152, 5.441767692565918, 5.766844749450684, 6.091921806335449, 6.416998863220215, 6.7420759201049805, 7.067152976989746, 7.392230033874512, 7.717307090759277, 8.042384147644043, 8.367462158203125, 8.69253921508789, 9.017616271972656, 9.342693328857422, 9.667770385742188, 9.992847442626953, 10.317924499511719, 10.643001556396484, 10.96807861328125, 11.293155670166016]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 19.0, 24.0, 25.0, 53.0, 97.0, 135.0, 228.0, 447.0, 803.0, 1634.0, 3162.0, 7332.0, 19006.0, 53564.0, 170576.0, 543762.0, 1378455.0, 1297000.0, 485051.0, 152190.0, 48621.0, 17743.0, 7332.0, 3466.0, 1650.0, 801.0, 442.0, 272.0, 147.0, 77.0, 56.0, 31.0, 20.0, 19.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4883880615234375, -0.470916748046875, -0.4534454345703125, -0.43597412109375, -0.4185028076171875, -0.401031494140625, -0.3835601806640625, -0.3660888671875, -0.3486175537109375, -0.331146240234375, -0.3136749267578125, -0.29620361328125, -0.2787322998046875, -0.261260986328125, -0.2437896728515625, -0.226318359375, -0.2088470458984375, -0.191375732421875, -0.1739044189453125, -0.15643310546875, -0.1389617919921875, -0.121490478515625, -0.1040191650390625, -0.0865478515625, -0.0690765380859375, -0.051605224609375, -0.0341339111328125, -0.01666259765625, 0.0008087158203125, 0.018280029296875, 0.0357513427734375, 0.05322265625, 0.0706939697265625, 0.088165283203125, 0.1056365966796875, 0.12310791015625, 0.1405792236328125, 0.158050537109375, 0.1755218505859375, 0.1929931640625, 0.2104644775390625, 0.227935791015625, 0.2454071044921875, 0.26287841796875, 0.2803497314453125, 0.297821044921875, 0.3152923583984375, 0.332763671875, 0.3502349853515625, 0.367706298828125, 0.3851776123046875, 0.40264892578125, 0.4201202392578125, 0.437591552734375, 0.4550628662109375, 0.4725341796875, 0.4900054931640625, 0.507476806640625, 0.5249481201171875, 0.54241943359375, 0.5598907470703125, 0.577362060546875, 0.5948333740234375, 0.6123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 12.0, 9.0, 14.0, 17.0, 14.0, 20.0, 22.0, 28.0, 35.0, 37.0, 47.0, 46.0, 55.0, 45.0, 53.0, 52.0, 61.0, 52.0, 50.0, 40.0, 47.0, 34.0, 26.0, 33.0, 22.0, 27.0, 22.0, 14.0, 14.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.96484375, -0.9368820190429688, -0.9089202880859375, -0.8809585571289062, -0.852996826171875, -0.8250350952148438, -0.7970733642578125, -0.7691116333007812, -0.74114990234375, -0.7131881713867188, -0.6852264404296875, -0.6572647094726562, -0.629302978515625, -0.6013412475585938, -0.5733795166015625, -0.5454177856445312, -0.5174560546875, -0.48949432373046875, -0.4615325927734375, -0.43357086181640625, -0.405609130859375, -0.37764739990234375, -0.3496856689453125, -0.32172393798828125, -0.29376220703125, -0.26580047607421875, -0.2378387451171875, -0.20987701416015625, -0.181915283203125, -0.15395355224609375, -0.1259918212890625, -0.09803009033203125, -0.070068359375, -0.04210662841796875, -0.0141448974609375, 0.01381683349609375, 0.041778564453125, 0.06974029541015625, 0.0977020263671875, 0.12566375732421875, 0.15362548828125, 0.18158721923828125, 0.2095489501953125, 0.23751068115234375, 0.265472412109375, 0.29343414306640625, 0.3213958740234375, 0.34935760498046875, 0.3773193359375, 0.40528106689453125, 0.4332427978515625, 0.46120452880859375, 0.489166259765625, 0.5171279907226562, 0.5450897216796875, 0.5730514526367188, 0.60101318359375, 0.6289749145507812, 0.6569366455078125, 0.6848983764648438, 0.712860107421875, 0.7408218383789062, 0.7687835693359375, 0.7967453002929688, 0.82470703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 9.0, 19.0, 24.0, 23.0, 67.0, 121.0, 305.0, 893.0, 3611.0, 26262.0, 1118193.0, 2988474.0, 48750.0, 5562.0, 1213.0, 391.0, 142.0, 79.0, 44.0, 24.0, 16.0, 15.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.164459228515625, -2.09259033203125, -2.020721435546875, -1.9488525390625, -1.876983642578125, -1.80511474609375, -1.733245849609375, -1.661376953125, -1.589508056640625, -1.51763916015625, -1.445770263671875, -1.3739013671875, -1.302032470703125, -1.23016357421875, -1.158294677734375, -1.08642578125, -1.014556884765625, -0.94268798828125, -0.870819091796875, -0.7989501953125, -0.727081298828125, -0.65521240234375, -0.583343505859375, -0.511474609375, -0.439605712890625, -0.36773681640625, -0.295867919921875, -0.2239990234375, -0.152130126953125, -0.08026123046875, -0.008392333984375, 0.0634765625, 0.135345458984375, 0.20721435546875, 0.279083251953125, 0.3509521484375, 0.422821044921875, 0.49468994140625, 0.566558837890625, 0.638427734375, 0.710296630859375, 0.78216552734375, 0.854034423828125, 0.9259033203125, 0.997772216796875, 1.06964111328125, 1.141510009765625, 1.21337890625, 1.285247802734375, 1.35711669921875, 1.428985595703125, 1.5008544921875, 1.572723388671875, 1.64459228515625, 1.716461181640625, 1.788330078125, 1.860198974609375, 1.93206787109375, 2.003936767578125, 2.0758056640625, 2.147674560546875, 2.21954345703125, 2.291412353515625, 2.36328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 2.0, 6.0, 7.0, 17.0, 17.0, 29.0, 39.0, 64.0, 74.0, 116.0, 174.0, 272.0, 369.0, 480.0, 539.0, 497.0, 414.0, 277.0, 209.0, 134.0, 81.0, 62.0, 41.0, 30.0, 17.0, 18.0, 14.0, 6.0, 8.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.213226318359375, -1.17352294921875, -1.133819580078125, -1.0941162109375, -1.054412841796875, -1.01470947265625, -0.975006103515625, -0.935302734375, -0.895599365234375, -0.85589599609375, -0.816192626953125, -0.7764892578125, -0.736785888671875, -0.69708251953125, -0.657379150390625, -0.61767578125, -0.577972412109375, -0.53826904296875, -0.498565673828125, -0.4588623046875, -0.419158935546875, -0.37945556640625, -0.339752197265625, -0.300048828125, -0.260345458984375, -0.22064208984375, -0.180938720703125, -0.1412353515625, -0.101531982421875, -0.06182861328125, -0.022125244140625, 0.017578125, 0.057281494140625, 0.09698486328125, 0.136688232421875, 0.1763916015625, 0.216094970703125, 0.25579833984375, 0.295501708984375, 0.335205078125, 0.374908447265625, 0.41461181640625, 0.454315185546875, 0.4940185546875, 0.533721923828125, 0.57342529296875, 0.613128662109375, 0.65283203125, 0.692535400390625, 0.73223876953125, 0.771942138671875, 0.8116455078125, 0.851348876953125, 0.89105224609375, 0.930755615234375, 0.970458984375, 1.010162353515625, 1.04986572265625, 1.089569091796875, 1.1292724609375, 1.168975830078125, 1.20867919921875, 1.248382568359375, 1.2880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 13.0, 22.0, 33.0, 84.0, 125.0, 180.0, 187.0, 146.0, 86.0, 46.0, 22.0, 19.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.760187149047852, -10.333600997924805, -9.907015800476074, -9.480429649353027, -9.05384349822998, -8.62725830078125, -8.200672149658203, -7.774085998535156, -7.347500324249268, -6.920914649963379, -6.494328498840332, -6.067742824554443, -5.641157150268555, -5.214570999145508, -4.787985324859619, -4.3613996505737305, -3.9348134994506836, -3.508227586746216, -3.081641674041748, -2.6550559997558594, -2.2284700870513916, -1.8018841743469238, -1.3752985000610352, -0.9487125873565674, -0.5221266746520996, -0.09554082155227661, 0.3310450315475464, 0.7576308250427246, 1.1842167377471924, 1.6108026504516602, 2.037388324737549, 2.4639742374420166, 2.8905601501464844, 3.317146062850952, 3.74373197555542, 4.170317649841309, 4.5969038009643555, 5.023489475250244, 5.450075149536133, 5.87666130065918, 6.303246974945068, 6.729832649230957, 7.156418800354004, 7.583004474639893, 8.009590148925781, 8.436176300048828, 8.862762451171875, 9.289347648620605, 9.715933799743652, 10.1425199508667, 10.56910514831543, 10.995691299438477, 11.422277450561523, 11.84886360168457, 12.2754487991333, 12.702034950256348, 13.128620147705078, 13.555206298828125, 13.981791496276855, 14.408377647399902, 14.83496379852295, 15.26154899597168, 15.688135147094727, 16.114721298217773, 16.54130744934082]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 20.0, 11.0, 13.0, 15.0, 36.0, 21.0, 36.0, 39.0, 54.0, 47.0, 41.0, 45.0, 39.0, 54.0, 61.0, 36.0, 34.0, 50.0, 45.0, 42.0, 41.0, 26.0, 20.0, 33.0, 20.0, 15.0, 20.0, 12.0, 12.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.060419082641602, -5.824182987213135, -5.58794641494751, -5.351710319519043, -5.115473747253418, -4.879237651824951, -4.643001556396484, -4.406764984130859, -4.170528888702393, -3.9342925548553467, -3.698056221008301, -3.461820125579834, -3.225583791732788, -2.989347457885742, -2.7531113624572754, -2.5168750286102295, -2.2806386947631836, -2.0444023609161377, -1.8081661462783813, -1.571929931640625, -1.335693597793579, -1.0994572639465332, -0.8632210493087769, -0.6269848346710205, -0.3907485008239746, -0.1545122265815735, 0.08172404766082764, 0.31796032190322876, 0.5541965961456299, 0.7904329299926758, 1.0266691446304321, 1.2629053592681885, 1.4991416931152344, 1.7353780269622803, 1.9716142416000366, 2.207850456237793, 2.444086790084839, 2.6803231239318848, 2.9165592193603516, 3.1527955532073975, 3.3890318870544434, 3.6252682209014893, 3.861504554748535, 4.097740650177002, 4.333976745605469, 4.570213317871094, 4.8064494132995605, 5.042685508728027, 5.278922080993652, 5.515158176422119, 5.751394748687744, 5.987630844116211, 6.223867416381836, 6.460103511810303, 6.6963396072387695, 6.9325761795043945, 7.168812274932861, 7.405048370361328, 7.641284942626953, 7.87752103805542, 8.113757133483887, 8.349993705749512, 8.586230278015137, 8.822465896606445, 9.05870246887207]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 10.0, 10.0, 29.0, 46.0, 60.0, 73.0, 124.0, 169.0, 240.0, 433.0, 617.0, 1035.0, 1843.0, 3038.0, 5518.0, 10755.0, 20852.0, 41717.0, 83479.0, 159600.0, 244352.0, 217691.0, 125873.0, 63769.0, 31999.0, 16073.0, 8327.0, 4483.0, 2490.0, 1396.0, 890.0, 546.0, 327.0, 220.0, 135.0, 104.0, 56.0, 56.0, 31.0, 19.0, 13.0, 13.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76953125, -0.7445526123046875, -0.719573974609375, -0.6945953369140625, -0.66961669921875, -0.6446380615234375, -0.619659423828125, -0.5946807861328125, -0.5697021484375, -0.5447235107421875, -0.519744873046875, -0.4947662353515625, -0.46978759765625, -0.4448089599609375, -0.419830322265625, -0.3948516845703125, -0.369873046875, -0.3448944091796875, -0.319915771484375, -0.2949371337890625, -0.26995849609375, -0.2449798583984375, -0.220001220703125, -0.1950225830078125, -0.1700439453125, -0.1450653076171875, -0.120086669921875, -0.0951080322265625, -0.07012939453125, -0.0451507568359375, -0.020172119140625, 0.0048065185546875, 0.02978515625, 0.0547637939453125, 0.079742431640625, 0.1047210693359375, 0.12969970703125, 0.1546783447265625, 0.179656982421875, 0.2046356201171875, 0.2296142578125, 0.2545928955078125, 0.279571533203125, 0.3045501708984375, 0.32952880859375, 0.3545074462890625, 0.379486083984375, 0.4044647216796875, 0.429443359375, 0.4544219970703125, 0.479400634765625, 0.5043792724609375, 0.52935791015625, 0.5543365478515625, 0.579315185546875, 0.6042938232421875, 0.6292724609375, 0.6542510986328125, 0.679229736328125, 0.7042083740234375, 0.72918701171875, 0.7541656494140625, 0.779144287109375, 0.8041229248046875, 0.8291015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 18.0, 19.0, 25.0, 24.0, 31.0, 33.0, 33.0, 42.0, 45.0, 41.0, 59.0, 58.0, 50.0, 59.0, 52.0, 41.0, 43.0, 52.0, 38.0, 37.0, 27.0, 26.0, 21.0, 24.0, 13.0, 6.0, 11.0, 7.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0009765625, -0.9727554321289062, -0.9445343017578125, -0.9163131713867188, -0.888092041015625, -0.8598709106445312, -0.8316497802734375, -0.8034286499023438, -0.77520751953125, -0.7469863891601562, -0.7187652587890625, -0.6905441284179688, -0.662322998046875, -0.6341018676757812, -0.6058807373046875, -0.5776596069335938, -0.5494384765625, -0.5212173461914062, -0.4929962158203125, -0.46477508544921875, -0.436553955078125, -0.40833282470703125, -0.3801116943359375, -0.35189056396484375, -0.32366943359375, -0.29544830322265625, -0.2672271728515625, -0.23900604248046875, -0.210784912109375, -0.18256378173828125, -0.1543426513671875, -0.12612152099609375, -0.097900390625, -0.06967926025390625, -0.0414581298828125, -0.01323699951171875, 0.014984130859375, 0.04320526123046875, 0.0714263916015625, 0.09964752197265625, 0.12786865234375, 0.15608978271484375, 0.1843109130859375, 0.21253204345703125, 0.240753173828125, 0.26897430419921875, 0.2971954345703125, 0.32541656494140625, 0.3536376953125, 0.38185882568359375, 0.4100799560546875, 0.43830108642578125, 0.466522216796875, 0.49474334716796875, 0.5229644775390625, 0.5511856079101562, 0.57940673828125, 0.6076278686523438, 0.6358489990234375, 0.6640701293945312, 0.692291259765625, 0.7205123901367188, 0.7487335205078125, 0.7769546508789062, 0.80517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 14.0, 6.0, 25.0, 22.0, 32.0, 37.0, 52.0, 60.0, 77.0, 120.0, 182.0, 251.0, 357.0, 573.0, 1008.0, 1917.0, 5098.0, 16786.0, 71799.0, 439197.0, 412825.0, 71463.0, 16759.0, 4950.0, 1994.0, 943.0, 577.0, 384.0, 273.0, 160.0, 150.0, 105.0, 76.0, 55.0, 39.0, 43.0, 27.0, 32.0, 18.0, 19.0, 13.0, 4.0, 6.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.6162109375, -1.5640716552734375, -1.511932373046875, -1.4597930908203125, -1.40765380859375, -1.3555145263671875, -1.303375244140625, -1.2512359619140625, -1.1990966796875, -1.1469573974609375, -1.094818115234375, -1.0426788330078125, -0.99053955078125, -0.9384002685546875, -0.886260986328125, -0.8341217041015625, -0.781982421875, -0.7298431396484375, -0.677703857421875, -0.6255645751953125, -0.57342529296875, -0.5212860107421875, -0.469146728515625, -0.4170074462890625, -0.3648681640625, -0.3127288818359375, -0.260589599609375, -0.2084503173828125, -0.15631103515625, -0.1041717529296875, -0.052032470703125, 0.0001068115234375, 0.05224609375, 0.1043853759765625, 0.156524658203125, 0.2086639404296875, 0.26080322265625, 0.3129425048828125, 0.365081787109375, 0.4172210693359375, 0.4693603515625, 0.5214996337890625, 0.573638916015625, 0.6257781982421875, 0.67791748046875, 0.7300567626953125, 0.782196044921875, 0.8343353271484375, 0.886474609375, 0.9386138916015625, 0.990753173828125, 1.0428924560546875, 1.09503173828125, 1.1471710205078125, 1.199310302734375, 1.2514495849609375, 1.3035888671875, 1.3557281494140625, 1.407867431640625, 1.4600067138671875, 1.51214599609375, 1.5642852783203125, 1.616424560546875, 1.6685638427734375, 1.720703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 14.0, 16.0, 10.0, 14.0, 19.0, 26.0, 29.0, 48.0, 34.0, 46.0, 38.0, 46.0, 47.0, 58.0, 58.0, 35.0, 55.0, 45.0, 46.0, 34.0, 40.0, 34.0, 35.0, 21.0, 26.0, 19.0, 10.0, 11.0, 11.0, 12.0, 14.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.6295166015625, -2.540283203125, -2.4510498046875, -2.36181640625, -2.2725830078125, -2.183349609375, -2.0941162109375, -2.0048828125, -1.9156494140625, -1.826416015625, -1.7371826171875, -1.64794921875, -1.5587158203125, -1.469482421875, -1.3802490234375, -1.291015625, -1.2017822265625, -1.112548828125, -1.0233154296875, -0.93408203125, -0.8448486328125, -0.755615234375, -0.6663818359375, -0.5771484375, -0.4879150390625, -0.398681640625, -0.3094482421875, -0.22021484375, -0.1309814453125, -0.041748046875, 0.0474853515625, 0.13671875, 0.2259521484375, 0.315185546875, 0.4044189453125, 0.49365234375, 0.5828857421875, 0.672119140625, 0.7613525390625, 0.8505859375, 0.9398193359375, 1.029052734375, 1.1182861328125, 1.20751953125, 1.2967529296875, 1.385986328125, 1.4752197265625, 1.564453125, 1.6536865234375, 1.742919921875, 1.8321533203125, 1.92138671875, 2.0106201171875, 2.099853515625, 2.1890869140625, 2.2783203125, 2.3675537109375, 2.456787109375, 2.5460205078125, 2.63525390625, 2.7244873046875, 2.813720703125, 2.9029541015625, 2.9921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 11.0, 11.0, 16.0, 25.0, 38.0, 46.0, 51.0, 82.0, 167.0, 259.0, 444.0, 929.0, 1916.0, 4834.0, 13566.0, 44427.0, 174811.0, 628148.0, 126864.0, 33769.0, 10707.0, 3905.0, 1652.0, 757.0, 435.0, 242.0, 133.0, 76.0, 67.0, 48.0, 25.0, 18.0, 10.0, 13.0, 3.0, 9.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4221000671386719, -0.40865325927734375, -0.3952064514160156, -0.3817596435546875, -0.3683128356933594, -0.35486602783203125, -0.3414192199707031, -0.327972412109375, -0.3145256042480469, -0.30107879638671875, -0.2876319885253906, -0.2741851806640625, -0.2607383728027344, -0.24729156494140625, -0.23384475708007812, -0.22039794921875, -0.20695114135742188, -0.19350433349609375, -0.18005752563476562, -0.1666107177734375, -0.15316390991210938, -0.13971710205078125, -0.12627029418945312, -0.112823486328125, -0.09937667846679688, -0.08592987060546875, -0.07248306274414062, -0.0590362548828125, -0.045589447021484375, -0.03214263916015625, -0.018695831298828125, -0.0052490234375, 0.008197784423828125, 0.02164459228515625, 0.035091400146484375, 0.0485382080078125, 0.061985015869140625, 0.07543182373046875, 0.08887863159179688, 0.102325439453125, 0.11577224731445312, 0.12921905517578125, 0.14266586303710938, 0.1561126708984375, 0.16955947875976562, 0.18300628662109375, 0.19645309448242188, 0.20989990234375, 0.22334671020507812, 0.23679351806640625, 0.2502403259277344, 0.2636871337890625, 0.2771339416503906, 0.29058074951171875, 0.3040275573730469, 0.317474365234375, 0.3309211730957031, 0.34436798095703125, 0.3578147888183594, 0.3712615966796875, 0.3847084045410156, 0.39815521240234375, 0.4116020202636719, 0.425048828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 8.0, 9.0, 16.0, 16.0, 23.0, 48.0, 71.0, 89.0, 125.0, 135.0, 119.0, 100.0, 67.0, 44.0, 29.0, 26.0, 23.0, 15.0, 6.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023281574249267578, -0.00022627972066402435, -0.00021974369883537292, -0.0002132076770067215, -0.00020667165517807007, -0.00020013563334941864, -0.0001935996115207672, -0.00018706358969211578, -0.00018052756786346436, -0.00017399154603481293, -0.0001674555242061615, -0.00016091950237751007, -0.00015438348054885864, -0.00014784745872020721, -0.00014131143689155579, -0.00013477541506290436, -0.00012823939323425293, -0.0001217033714056015, -0.00011516734957695007, -0.00010863132774829865, -0.00010209530591964722, -9.555928409099579e-05, -8.902326226234436e-05, -8.248724043369293e-05, -7.59512186050415e-05, -6.941519677639008e-05, -6.287917494773865e-05, -5.634315311908722e-05, -4.980713129043579e-05, -4.327110946178436e-05, -3.6735087633132935e-05, -3.0199065804481506e-05, -2.3663043975830078e-05, -1.712702214717865e-05, -1.0591000318527222e-05, -4.0549784898757935e-06, 2.4810433387756348e-06, 9.017065167427063e-06, 1.555308699607849e-05, 2.208910882472992e-05, 2.8625130653381348e-05, 3.5161152482032776e-05, 4.1697174310684204e-05, 4.823319613933563e-05, 5.476921796798706e-05, 6.130523979663849e-05, 6.784126162528992e-05, 7.437728345394135e-05, 8.091330528259277e-05, 8.74493271112442e-05, 9.398534893989563e-05, 0.00010052137076854706, 0.00010705739259719849, 0.00011359341442584991, 0.00012012943625450134, 0.00012666545808315277, 0.0001332014799118042, 0.00013973750174045563, 0.00014627352356910706, 0.00015280954539775848, 0.0001593455672264099, 0.00016588158905506134, 0.00017241761088371277, 0.0001789536327123642, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 13.0, 17.0, 21.0, 30.0, 57.0, 113.0, 177.0, 316.0, 620.0, 1553.0, 4644.0, 19043.0, 118800.0, 740728.0, 133734.0, 20729.0, 4984.0, 1585.0, 672.0, 296.0, 175.0, 92.0, 56.0, 34.0, 12.0, 14.0, 8.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.72265625, -0.7038993835449219, -0.6851425170898438, -0.6663856506347656, -0.6476287841796875, -0.6288719177246094, -0.6101150512695312, -0.5913581848144531, -0.572601318359375, -0.5538444519042969, -0.5350875854492188, -0.5163307189941406, -0.4975738525390625, -0.4788169860839844, -0.46006011962890625, -0.4413032531738281, -0.42254638671875, -0.4037895202636719, -0.38503265380859375, -0.3662757873535156, -0.3475189208984375, -0.3287620544433594, -0.31000518798828125, -0.2912483215332031, -0.272491455078125, -0.2537345886230469, -0.23497772216796875, -0.21622085571289062, -0.1974639892578125, -0.17870712280273438, -0.15995025634765625, -0.14119338989257812, -0.1224365234375, -0.10367965698242188, -0.08492279052734375, -0.06616592407226562, -0.0474090576171875, -0.028652191162109375, -0.00989532470703125, 0.008861541748046875, 0.027618408203125, 0.046375274658203125, 0.06513214111328125, 0.08388900756835938, 0.1026458740234375, 0.12140274047851562, 0.14015960693359375, 0.15891647338867188, 0.17767333984375, 0.19643020629882812, 0.21518707275390625, 0.23394393920898438, 0.2527008056640625, 0.2714576721191406, 0.29021453857421875, 0.3089714050292969, 0.327728271484375, 0.3464851379394531, 0.36524200439453125, 0.3839988708496094, 0.4027557373046875, 0.4215126037597656, 0.44026947021484375, 0.4590263366699219, 0.477783203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 1.0, 5.0, 11.0, 13.0, 20.0, 29.0, 34.0, 49.0, 82.0, 100.0, 102.0, 102.0, 119.0, 83.0, 77.0, 44.0, 34.0, 23.0, 19.0, 16.0, 12.0, 5.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5746002197265625, -0.553009033203125, -0.5314178466796875, -0.50982666015625, -0.4882354736328125, -0.466644287109375, -0.4450531005859375, -0.4234619140625, -0.4018707275390625, -0.380279541015625, -0.3586883544921875, -0.33709716796875, -0.3155059814453125, -0.293914794921875, -0.2723236083984375, -0.250732421875, -0.2291412353515625, -0.207550048828125, -0.1859588623046875, -0.16436767578125, -0.1427764892578125, -0.121185302734375, -0.0995941162109375, -0.0780029296875, -0.0564117431640625, -0.034820556640625, -0.0132293701171875, 0.00836181640625, 0.0299530029296875, 0.051544189453125, 0.0731353759765625, 0.0947265625, 0.1163177490234375, 0.137908935546875, 0.1595001220703125, 0.18109130859375, 0.2026824951171875, 0.224273681640625, 0.2458648681640625, 0.2674560546875, 0.2890472412109375, 0.310638427734375, 0.3322296142578125, 0.35382080078125, 0.3754119873046875, 0.397003173828125, 0.4185943603515625, 0.440185546875, 0.4617767333984375, 0.483367919921875, 0.5049591064453125, 0.52655029296875, 0.5481414794921875, 0.569732666015625, 0.5913238525390625, 0.6129150390625, 0.6345062255859375, 0.656097412109375, 0.6776885986328125, 0.69927978515625, 0.7208709716796875, 0.742462158203125, 0.7640533447265625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 7.0, 16.0, 47.0, 63.0, 111.0, 190.0, 291.0, 123.0, 65.0, 36.0, 17.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890586853027344, -19.39608383178711, -18.901580810546875, -18.40707778930664, -17.912574768066406, -17.418071746826172, -16.923568725585938, -16.429065704345703, -15.934563636779785, -15.44006061553955, -14.945557594299316, -14.451054573059082, -13.956552505493164, -13.46204948425293, -12.967546463012695, -12.473043441772461, -11.978540420532227, -11.484037399291992, -10.989534378051758, -10.495031356811523, -10.000528335571289, -9.506025314331055, -9.011523246765137, -8.517020225524902, -8.022517204284668, -7.528014183044434, -7.033511161804199, -6.539008617401123, -6.044505596160889, -5.550002574920654, -5.055500030517578, -4.560997009277344, -4.066493988037109, -3.571990966796875, -3.0774881839752197, -2.5829854011535645, -2.08848237991333, -1.5939793586730957, -1.0994765758514404, -0.6049737930297852, -0.11047077178955078, 0.38403213024139404, 0.8785350322723389, 1.3730379343032837, 1.8675408363342285, 2.362043857574463, 2.856546640396118, 3.3510494232177734, 3.845552444458008, 4.340055465698242, 4.834558486938477, 5.329061031341553, 5.823564052581787, 6.3180670738220215, 6.812569618225098, 7.307072639465332, 7.801575660705566, 8.2960786819458, 8.790581703186035, 9.28508472442627, 9.779586791992188, 10.274089813232422, 10.768592834472656, 11.26309585571289, 11.757598876953125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 6.0, 2.0, 10.0, 6.0, 12.0, 20.0, 14.0, 16.0, 19.0, 23.0, 18.0, 25.0, 26.0, 21.0, 41.0, 46.0, 46.0, 95.0, 115.0, 70.0, 49.0, 34.0, 35.0, 29.0, 31.0, 26.0, 29.0, 21.0, 19.0, 13.0, 10.0, 11.0, 10.0, 6.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.874667167663574, -9.539567947387695, -9.204469680786133, -8.86937141418457, -8.534272193908691, -8.199172973632812, -7.86407470703125, -7.528975963592529, -7.193877220153809, -6.858778476715088, -6.523679733276367, -6.1885809898376465, -5.853482246398926, -5.518383502960205, -5.183284759521484, -4.848186016082764, -4.513087272644043, -4.177988529205322, -3.8428897857666016, -3.507791042327881, -3.17269229888916, -2.8375935554504395, -2.5024948120117188, -2.167396068572998, -1.8322973251342773, -1.4971985816955566, -1.162099838256836, -0.8270010948181152, -0.49190235137939453, -0.15680360794067383, 0.17829513549804688, 0.5133938789367676, 0.8484916687011719, 1.1835904121398926, 1.5186891555786133, 1.853787899017334, 2.1888866424560547, 2.5239853858947754, 2.859084129333496, 3.194182872772217, 3.5292816162109375, 3.864380359649658, 4.199479103088379, 4.5345778465271, 4.86967658996582, 5.204775333404541, 5.539874076843262, 5.874972820281982, 6.210071563720703, 6.545170307159424, 6.8802690505981445, 7.215367794036865, 7.550466537475586, 7.885565280914307, 8.220664024353027, 8.555763244628906, 8.890861511230469, 9.225959777832031, 9.56105899810791, 9.896158218383789, 10.231256484985352, 10.566354751586914, 10.901453971862793, 11.236553192138672, 11.571651458740234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 21.0, 18.0, 25.0, 42.0, 60.0, 88.0, 153.0, 223.0, 380.0, 596.0, 1143.0, 2323.0, 5442.0, 14369.0, 42554.0, 144867.0, 488748.0, 1296868.0, 1409177.0, 549073.0, 161110.0, 48314.0, 16360.0, 6426.0, 2770.0, 1377.0, 691.0, 373.0, 221.0, 133.0, 99.0, 63.0, 52.0, 22.0, 24.0, 17.0, 13.0, 5.0, 6.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.65185546875, -0.6327133178710938, -0.6135711669921875, -0.5944290161132812, -0.575286865234375, -0.5561447143554688, -0.5370025634765625, -0.5178604125976562, -0.49871826171875, -0.47957611083984375, -0.4604339599609375, -0.44129180908203125, -0.422149658203125, -0.40300750732421875, -0.3838653564453125, -0.36472320556640625, -0.3455810546875, -0.32643890380859375, -0.3072967529296875, -0.28815460205078125, -0.269012451171875, -0.24987030029296875, -0.2307281494140625, -0.21158599853515625, -0.19244384765625, -0.17330169677734375, -0.1541595458984375, -0.13501739501953125, -0.115875244140625, -0.09673309326171875, -0.0775909423828125, -0.05844879150390625, -0.039306640625, -0.02016448974609375, -0.0010223388671875, 0.01811981201171875, 0.037261962890625, 0.05640411376953125, 0.0755462646484375, 0.09468841552734375, 0.11383056640625, 0.13297271728515625, 0.1521148681640625, 0.17125701904296875, 0.190399169921875, 0.20954132080078125, 0.2286834716796875, 0.24782562255859375, 0.2669677734375, 0.28610992431640625, 0.3052520751953125, 0.32439422607421875, 0.343536376953125, 0.36267852783203125, 0.3818206787109375, 0.40096282958984375, 0.42010498046875, 0.43924713134765625, 0.4583892822265625, 0.47753143310546875, 0.496673583984375, 0.5158157348632812, 0.5349578857421875, 0.5541000366210938, 0.5732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 7.0, 6.0, 15.0, 10.0, 26.0, 17.0, 29.0, 28.0, 36.0, 36.0, 47.0, 37.0, 54.0, 45.0, 52.0, 57.0, 41.0, 48.0, 44.0, 52.0, 37.0, 30.0, 37.0, 35.0, 35.0, 26.0, 19.0, 15.0, 10.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.96484375, -0.9371109008789062, -0.9093780517578125, -0.8816452026367188, -0.853912353515625, -0.8261795043945312, -0.7984466552734375, -0.7707138061523438, -0.74298095703125, -0.7152481079101562, -0.6875152587890625, -0.6597824096679688, -0.632049560546875, -0.6043167114257812, -0.5765838623046875, -0.5488510131835938, -0.5211181640625, -0.49338531494140625, -0.4656524658203125, -0.43791961669921875, -0.410186767578125, -0.38245391845703125, -0.3547210693359375, -0.32698822021484375, -0.29925537109375, -0.27152252197265625, -0.2437896728515625, -0.21605682373046875, -0.188323974609375, -0.16059112548828125, -0.1328582763671875, -0.10512542724609375, -0.077392578125, -0.04965972900390625, -0.0219268798828125, 0.00580596923828125, 0.033538818359375, 0.06127166748046875, 0.0890045166015625, 0.11673736572265625, 0.14447021484375, 0.17220306396484375, 0.1999359130859375, 0.22766876220703125, 0.255401611328125, 0.28313446044921875, 0.3108673095703125, 0.33860015869140625, 0.3663330078125, 0.39406585693359375, 0.4217987060546875, 0.44953155517578125, 0.477264404296875, 0.5049972534179688, 0.5327301025390625, 0.5604629516601562, 0.58819580078125, 0.6159286499023438, 0.6436614990234375, 0.6713943481445312, 0.699127197265625, 0.7268600463867188, 0.7545928955078125, 0.7823257446289062, 0.81005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 10.0, 22.0, 21.0, 18.0, 38.0, 84.0, 159.0, 279.0, 655.0, 2138.0, 12122.0, 157344.0, 3646417.0, 349956.0, 19916.0, 3219.0, 982.0, 398.0, 201.0, 107.0, 62.0, 35.0, 30.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9404296875, -1.8770294189453125, -1.813629150390625, -1.7502288818359375, -1.68682861328125, -1.6234283447265625, -1.560028076171875, -1.4966278076171875, -1.4332275390625, -1.3698272705078125, -1.306427001953125, -1.2430267333984375, -1.17962646484375, -1.1162261962890625, -1.052825927734375, -0.9894256591796875, -0.926025390625, -0.8626251220703125, -0.799224853515625, -0.7358245849609375, -0.67242431640625, -0.6090240478515625, -0.545623779296875, -0.4822235107421875, -0.4188232421875, -0.3554229736328125, -0.292022705078125, -0.2286224365234375, -0.16522216796875, -0.1018218994140625, -0.038421630859375, 0.0249786376953125, 0.08837890625, 0.1517791748046875, 0.215179443359375, 0.2785797119140625, 0.34197998046875, 0.4053802490234375, 0.468780517578125, 0.5321807861328125, 0.5955810546875, 0.6589813232421875, 0.722381591796875, 0.7857818603515625, 0.84918212890625, 0.9125823974609375, 0.975982666015625, 1.0393829345703125, 1.102783203125, 1.1661834716796875, 1.229583740234375, 1.2929840087890625, 1.35638427734375, 1.4197845458984375, 1.483184814453125, 1.5465850830078125, 1.6099853515625, 1.6733856201171875, 1.736785888671875, 1.8001861572265625, 1.86358642578125, 1.9269866943359375, 1.990386962890625, 2.0537872314453125, 2.1171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 5.0, 5.0, 14.0, 5.0, 9.0, 14.0, 21.0, 26.0, 39.0, 76.0, 105.0, 146.0, 210.0, 312.0, 416.0, 503.0, 515.0, 498.0, 333.0, 230.0, 163.0, 115.0, 61.0, 60.0, 40.0, 41.0, 30.0, 24.0, 16.0, 5.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8788375854492188, -0.8372650146484375, -0.7956924438476562, -0.754119873046875, -0.7125473022460938, -0.6709747314453125, -0.6294021606445312, -0.58782958984375, -0.5462570190429688, -0.5046844482421875, -0.46311187744140625, -0.421539306640625, -0.37996673583984375, -0.3383941650390625, -0.29682159423828125, -0.2552490234375, -0.21367645263671875, -0.1721038818359375, -0.13053131103515625, -0.088958740234375, -0.04738616943359375, -0.0058135986328125, 0.03575897216796875, 0.07733154296875, 0.11890411376953125, 0.1604766845703125, 0.20204925537109375, 0.243621826171875, 0.28519439697265625, 0.3267669677734375, 0.36833953857421875, 0.409912109375, 0.45148468017578125, 0.4930572509765625, 0.5346298217773438, 0.576202392578125, 0.6177749633789062, 0.6593475341796875, 0.7009201049804688, 0.74249267578125, 0.7840652465820312, 0.8256378173828125, 0.8672103881835938, 0.908782958984375, 0.9503555297851562, 0.9919281005859375, 1.0335006713867188, 1.0750732421875, 1.1166458129882812, 1.1582183837890625, 1.1997909545898438, 1.241363525390625, 1.2829360961914062, 1.3245086669921875, 1.3660812377929688, 1.40765380859375, 1.4492263793945312, 1.4907989501953125, 1.5323715209960938, 1.573944091796875, 1.6155166625976562, 1.6570892333984375, 1.6986618041992188, 1.740234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 22.0, 31.0, 70.0, 106.0, 165.0, 183.0, 148.0, 113.0, 62.0, 31.0, 12.0, 15.0, 7.0, 9.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9807820320129395, -6.546756267547607, -6.112730503082275, -5.678705215454102, -5.2446794509887695, -4.8106536865234375, -4.3766279220581055, -3.9426021575927734, -3.5085763931274414, -3.0745506286621094, -2.6405248641967773, -2.2064993381500244, -1.7724735736846924, -1.3384478092193604, -0.9044222831726074, -0.4703965187072754, -0.03637075424194336, 0.3976549506187439, 0.8316806554794312, 1.2657063007354736, 1.6997320652008057, 2.1337578296661377, 2.5677833557128906, 3.0018091201782227, 3.4358348846435547, 3.8698606491088867, 4.303886413574219, 4.737912178039551, 5.171937942504883, 5.605963706970215, 6.039988994598389, 6.474014759063721, 6.908041000366211, 7.342066764831543, 7.776092529296875, 8.210118293762207, 8.644144058227539, 9.078169822692871, 9.512195587158203, 9.946220397949219, 10.380247116088867, 10.8142728805542, 11.248298645019531, 11.682324409484863, 12.116350173950195, 12.550375938415527, 12.98440170288086, 13.418426513671875, 13.852452278137207, 14.286478042602539, 14.720503807067871, 15.154529571533203, 15.588555335998535, 16.022581100463867, 16.456605911254883, 16.89063262939453, 17.324657440185547, 17.758682250976562, 18.19270896911621, 18.626733779907227, 19.060760498046875, 19.49478530883789, 19.92881202697754, 20.362836837768555, 20.796863555908203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 15.0, 16.0, 24.0, 33.0, 46.0, 39.0, 35.0, 35.0, 35.0, 33.0, 47.0, 44.0, 39.0, 47.0, 50.0, 55.0, 46.0, 33.0, 31.0, 29.0, 37.0, 31.0, 36.0, 32.0, 24.0, 13.0, 17.0, 7.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.798887252807617, -6.553752422332764, -6.308617115020752, -6.063482284545898, -5.818346977233887, -5.573212146759033, -5.32807731628418, -5.082942008972168, -4.8378071784973145, -4.592672348022461, -4.347537040710449, -4.102402210235596, -3.857267141342163, -3.6121320724487305, -3.366997241973877, -3.1218621730804443, -2.8767271041870117, -2.631592035293579, -2.3864569664001465, -2.141322135925293, -1.8961870670318604, -1.6510519981384277, -1.4059170484542847, -1.1607820987701416, -0.915647029876709, -0.6705120205879211, -0.4253770112991333, -0.18024200201034546, 0.06489300727844238, 0.310028076171875, 0.5551630258560181, 0.8002979755401611, 1.0454330444335938, 1.2905681133270264, 1.5357030630111694, 1.7808380126953125, 2.025973081588745, 2.2711081504821777, 2.5162429809570312, 2.761378049850464, 3.0065131187438965, 3.251648187637329, 3.4967832565307617, 3.7419180870056152, 3.987053155899048, 4.2321882247924805, 4.477323055267334, 4.7224578857421875, 4.967593193054199, 5.212728023529053, 5.4578633308410645, 5.702998161315918, 5.94813346862793, 6.193268299102783, 6.438403129577637, 6.683538436889648, 6.928673267364502, 7.1738080978393555, 7.418943405151367, 7.664078235626221, 7.909213066101074, 8.154348373413086, 8.399483680725098, 8.644618034362793, 8.889753341674805]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 9.0, 16.0, 27.0, 42.0, 77.0, 106.0, 182.0, 267.0, 471.0, 800.0, 1531.0, 2796.0, 5459.0, 10795.0, 23141.0, 52855.0, 131360.0, 304760.0, 294359.0, 125284.0, 50382.0, 21973.0, 10445.0, 5163.0, 2746.0, 1502.0, 803.0, 448.0, 280.0, 176.0, 97.0, 56.0, 53.0, 30.0, 15.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154296875, -1.1144561767578125, -1.074615478515625, -1.0347747802734375, -0.99493408203125, -0.9550933837890625, -0.915252685546875, -0.8754119873046875, -0.8355712890625, -0.7957305908203125, -0.755889892578125, -0.7160491943359375, -0.67620849609375, -0.6363677978515625, -0.596527099609375, -0.5566864013671875, -0.516845703125, -0.4770050048828125, -0.437164306640625, -0.3973236083984375, -0.35748291015625, -0.3176422119140625, -0.277801513671875, -0.2379608154296875, -0.1981201171875, -0.1582794189453125, -0.118438720703125, -0.0785980224609375, -0.03875732421875, 0.0010833740234375, 0.040924072265625, 0.0807647705078125, 0.12060546875, 0.1604461669921875, 0.200286865234375, 0.2401275634765625, 0.27996826171875, 0.3198089599609375, 0.359649658203125, 0.3994903564453125, 0.4393310546875, 0.4791717529296875, 0.519012451171875, 0.5588531494140625, 0.59869384765625, 0.6385345458984375, 0.678375244140625, 0.7182159423828125, 0.758056640625, 0.7978973388671875, 0.837738037109375, 0.8775787353515625, 0.91741943359375, 0.9572601318359375, 0.997100830078125, 1.0369415283203125, 1.0767822265625, 1.1166229248046875, 1.156463623046875, 1.1963043212890625, 1.23614501953125, 1.2759857177734375, 1.315826416015625, 1.3556671142578125, 1.3955078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 22.0, 29.0, 20.0, 35.0, 37.0, 59.0, 57.0, 40.0, 60.0, 56.0, 56.0, 67.0, 52.0, 50.0, 55.0, 42.0, 35.0, 42.0, 32.0, 27.0, 20.0, 16.0, 10.0, 9.0, 10.0, 9.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9017791748046875, -0.868011474609375, -0.8342437744140625, -0.80047607421875, -0.7667083740234375, -0.732940673828125, -0.6991729736328125, -0.6654052734375, -0.6316375732421875, -0.597869873046875, -0.5641021728515625, -0.53033447265625, -0.4965667724609375, -0.462799072265625, -0.4290313720703125, -0.395263671875, -0.3614959716796875, -0.327728271484375, -0.2939605712890625, -0.26019287109375, -0.2264251708984375, -0.192657470703125, -0.1588897705078125, -0.1251220703125, -0.0913543701171875, -0.057586669921875, -0.0238189697265625, 0.00994873046875, 0.0437164306640625, 0.077484130859375, 0.1112518310546875, 0.14501953125, 0.1787872314453125, 0.212554931640625, 0.2463226318359375, 0.28009033203125, 0.3138580322265625, 0.347625732421875, 0.3813934326171875, 0.4151611328125, 0.4489288330078125, 0.482696533203125, 0.5164642333984375, 0.55023193359375, 0.5839996337890625, 0.617767333984375, 0.6515350341796875, 0.685302734375, 0.7190704345703125, 0.752838134765625, 0.7866058349609375, 0.82037353515625, 0.8541412353515625, 0.887908935546875, 0.9216766357421875, 0.9554443359375, 0.9892120361328125, 1.022979736328125, 1.0567474365234375, 1.09051513671875, 1.1242828369140625, 1.158050537109375, 1.1918182373046875, 1.2255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 14.0, 15.0, 17.0, 27.0, 34.0, 51.0, 74.0, 78.0, 106.0, 132.0, 212.0, 298.0, 418.0, 629.0, 968.0, 1907.0, 4633.0, 18695.0, 123896.0, 756737.0, 113111.0, 17126.0, 4498.0, 1830.0, 957.0, 649.0, 377.0, 285.0, 199.0, 134.0, 99.0, 79.0, 66.0, 52.0, 32.0, 36.0, 17.0, 15.0, 7.0, 5.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.165283203125, -2.09423828125, -2.023193359375, -1.9521484375, -1.881103515625, -1.81005859375, -1.739013671875, -1.66796875, -1.596923828125, -1.52587890625, -1.454833984375, -1.3837890625, -1.312744140625, -1.24169921875, -1.170654296875, -1.099609375, -1.028564453125, -0.95751953125, -0.886474609375, -0.8154296875, -0.744384765625, -0.67333984375, -0.602294921875, -0.53125, -0.460205078125, -0.38916015625, -0.318115234375, -0.2470703125, -0.176025390625, -0.10498046875, -0.033935546875, 0.037109375, 0.108154296875, 0.17919921875, 0.250244140625, 0.3212890625, 0.392333984375, 0.46337890625, 0.534423828125, 0.60546875, 0.676513671875, 0.74755859375, 0.818603515625, 0.8896484375, 0.960693359375, 1.03173828125, 1.102783203125, 1.173828125, 1.244873046875, 1.31591796875, 1.386962890625, 1.4580078125, 1.529052734375, 1.60009765625, 1.671142578125, 1.7421875, 1.813232421875, 1.88427734375, 1.955322265625, 2.0263671875, 2.097412109375, 2.16845703125, 2.239501953125, 2.310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 10.0, 13.0, 12.0, 13.0, 14.0, 24.0, 26.0, 32.0, 32.0, 32.0, 46.0, 43.0, 44.0, 56.0, 45.0, 63.0, 62.0, 53.0, 51.0, 53.0, 41.0, 33.0, 21.0, 30.0, 27.0, 20.0, 17.0, 10.0, 11.0, 16.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1796875, -3.078155517578125, -2.97662353515625, -2.875091552734375, -2.7735595703125, -2.672027587890625, -2.57049560546875, -2.468963623046875, -2.367431640625, -2.265899658203125, -2.16436767578125, -2.062835693359375, -1.9613037109375, -1.859771728515625, -1.75823974609375, -1.656707763671875, -1.55517578125, -1.453643798828125, -1.35211181640625, -1.250579833984375, -1.1490478515625, -1.047515869140625, -0.94598388671875, -0.844451904296875, -0.742919921875, -0.641387939453125, -0.53985595703125, -0.438323974609375, -0.3367919921875, -0.235260009765625, -0.13372802734375, -0.032196044921875, 0.0693359375, 0.170867919921875, 0.27239990234375, 0.373931884765625, 0.4754638671875, 0.576995849609375, 0.67852783203125, 0.780059814453125, 0.881591796875, 0.983123779296875, 1.08465576171875, 1.186187744140625, 1.2877197265625, 1.389251708984375, 1.49078369140625, 1.592315673828125, 1.69384765625, 1.795379638671875, 1.89691162109375, 1.998443603515625, 2.0999755859375, 2.201507568359375, 2.30303955078125, 2.404571533203125, 2.506103515625, 2.607635498046875, 2.70916748046875, 2.810699462890625, 2.9122314453125, 3.013763427734375, 3.11529541015625, 3.216827392578125, 3.318359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 8.0, 21.0, 43.0, 30.0, 64.0, 109.0, 147.0, 286.0, 522.0, 1136.0, 2931.0, 9559.0, 45292.0, 308668.0, 610829.0, 52413.0, 10858.0, 3146.0, 1145.0, 560.0, 302.0, 163.0, 95.0, 61.0, 50.0, 28.0, 22.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4754753112792969, -0.45851898193359375, -0.4415626525878906, -0.4246063232421875, -0.4076499938964844, -0.39069366455078125, -0.3737373352050781, -0.356781005859375, -0.3398246765136719, -0.32286834716796875, -0.3059120178222656, -0.2889556884765625, -0.2719993591308594, -0.25504302978515625, -0.23808670043945312, -0.22113037109375, -0.20417404174804688, -0.18721771240234375, -0.17026138305664062, -0.1533050537109375, -0.13634872436523438, -0.11939239501953125, -0.10243606567382812, -0.085479736328125, -0.06852340698242188, -0.05156707763671875, -0.034610748291015625, -0.0176544189453125, -0.000698089599609375, 0.01625823974609375, 0.033214569091796875, 0.0501708984375, 0.06712722778320312, 0.08408355712890625, 0.10103988647460938, 0.1179962158203125, 0.13495254516601562, 0.15190887451171875, 0.16886520385742188, 0.185821533203125, 0.20277786254882812, 0.21973419189453125, 0.23669052124023438, 0.2536468505859375, 0.2706031799316406, 0.28755950927734375, 0.3045158386230469, 0.32147216796875, 0.3384284973144531, 0.35538482666015625, 0.3723411560058594, 0.3892974853515625, 0.4062538146972656, 0.42321014404296875, 0.4401664733886719, 0.457122802734375, 0.4740791320800781, 0.49103546142578125, 0.5079917907714844, 0.5249481201171875, 0.5419044494628906, 0.5588607788085938, 0.5758171081542969, 0.5927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 7.0, 9.0, 12.0, 11.0, 18.0, 22.0, 24.0, 27.0, 29.0, 44.0, 74.0, 69.0, 77.0, 82.0, 88.0, 82.0, 66.0, 46.0, 38.0, 20.0, 29.0, 18.0, 24.0, 16.0, 9.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001481771469116211, -0.00014331750571727753, -0.00013845786452293396, -0.0001335982233285904, -0.00012873858213424683, -0.00012387894093990326, -0.00011901929974555969, -0.00011415965855121613, -0.00010930001735687256, -0.00010444037616252899, -9.958073496818542e-05, -9.472109377384186e-05, -8.986145257949829e-05, -8.500181138515472e-05, -8.014217019081116e-05, -7.528252899646759e-05, -7.042288780212402e-05, -6.556324660778046e-05, -6.070360541343689e-05, -5.584396421909332e-05, -5.0984323024749756e-05, -4.612468183040619e-05, -4.126504063606262e-05, -3.6405399441719055e-05, -3.154575824737549e-05, -2.668611705303192e-05, -2.1826475858688354e-05, -1.6966834664344788e-05, -1.210719347000122e-05, -7.247552275657654e-06, -2.387911081314087e-06, 2.47173011302948e-06, 7.331371307373047e-06, 1.2191012501716614e-05, 1.705065369606018e-05, 2.1910294890403748e-05, 2.6769936084747314e-05, 3.162957727909088e-05, 3.648921847343445e-05, 4.1348859667778015e-05, 4.620850086212158e-05, 5.106814205646515e-05, 5.5927783250808716e-05, 6.078742444515228e-05, 6.564706563949585e-05, 7.050670683383942e-05, 7.536634802818298e-05, 8.022598922252655e-05, 8.508563041687012e-05, 8.994527161121368e-05, 9.480491280555725e-05, 9.966455399990082e-05, 0.00010452419519424438, 0.00010938383638858795, 0.00011424347758293152, 0.00011910311877727509, 0.00012396275997161865, 0.00012882240116596222, 0.00013368204236030579, 0.00013854168355464935, 0.00014340132474899292, 0.0001482609659433365, 0.00015312060713768005, 0.00015798024833202362, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 5.0, 16.0, 27.0, 26.0, 41.0, 49.0, 110.0, 146.0, 234.0, 382.0, 708.0, 1440.0, 3633.0, 12015.0, 55845.0, 604014.0, 305091.0, 48002.0, 10509.0, 3282.0, 1325.0, 629.0, 394.0, 206.0, 137.0, 83.0, 45.0, 46.0, 24.0, 18.0, 14.0, 12.0, 11.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5430030822753906, -0.5279006958007812, -0.5127983093261719, -0.4976959228515625, -0.4825935363769531, -0.46749114990234375, -0.4523887634277344, -0.437286376953125, -0.4221839904785156, -0.40708160400390625, -0.3919792175292969, -0.3768768310546875, -0.3617744445800781, -0.34667205810546875, -0.3315696716308594, -0.31646728515625, -0.3013648986816406, -0.28626251220703125, -0.2711601257324219, -0.2560577392578125, -0.24095535278320312, -0.22585296630859375, -0.21075057983398438, -0.195648193359375, -0.18054580688476562, -0.16544342041015625, -0.15034103393554688, -0.1352386474609375, -0.12013626098632812, -0.10503387451171875, -0.08993148803710938, -0.0748291015625, -0.059726715087890625, -0.04462432861328125, -0.029521942138671875, -0.0144195556640625, 0.000682830810546875, 0.01578521728515625, 0.030887603759765625, 0.045989990234375, 0.061092376708984375, 0.07619476318359375, 0.09129714965820312, 0.1063995361328125, 0.12150192260742188, 0.13660430908203125, 0.15170669555664062, 0.16680908203125, 0.18191146850585938, 0.19701385498046875, 0.21211624145507812, 0.2272186279296875, 0.24232101440429688, 0.25742340087890625, 0.2725257873535156, 0.287628173828125, 0.3027305603027344, 0.31783294677734375, 0.3329353332519531, 0.3480377197265625, 0.3631401062011719, 0.37824249267578125, 0.3933448791503906, 0.408447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 15.0, 18.0, 19.0, 22.0, 25.0, 31.0, 28.0, 53.0, 65.0, 62.0, 88.0, 75.0, 82.0, 62.0, 45.0, 54.0, 44.0, 41.0, 29.0, 17.0, 17.0, 14.0, 13.0, 9.0, 9.0, 11.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.462158203125, -0.44886016845703125, -0.4355621337890625, -0.42226409912109375, -0.408966064453125, -0.39566802978515625, -0.3823699951171875, -0.36907196044921875, -0.35577392578125, -0.34247589111328125, -0.3291778564453125, -0.31587982177734375, -0.302581787109375, -0.28928375244140625, -0.2759857177734375, -0.26268768310546875, -0.2493896484375, -0.23609161376953125, -0.2227935791015625, -0.20949554443359375, -0.196197509765625, -0.18289947509765625, -0.1696014404296875, -0.15630340576171875, -0.14300537109375, -0.12970733642578125, -0.1164093017578125, -0.10311126708984375, -0.089813232421875, -0.07651519775390625, -0.0632171630859375, -0.04991912841796875, -0.03662109375, -0.02332305908203125, -0.0100250244140625, 0.00327301025390625, 0.016571044921875, 0.02986907958984375, 0.0431671142578125, 0.05646514892578125, 0.06976318359375, 0.08306121826171875, 0.0963592529296875, 0.10965728759765625, 0.122955322265625, 0.13625335693359375, 0.1495513916015625, 0.16284942626953125, 0.1761474609375, 0.18944549560546875, 0.2027435302734375, 0.21604156494140625, 0.229339599609375, 0.24263763427734375, 0.2559356689453125, 0.26923370361328125, 0.28253173828125, 0.29582977294921875, 0.3091278076171875, 0.32242584228515625, 0.335723876953125, 0.34902191162109375, 0.3623199462890625, 0.37561798095703125, 0.388916015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 11.0, 17.0, 23.0, 29.0, 66.0, 96.0, 148.0, 333.0, 131.0, 61.0, 46.0, 16.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.230846405029297, -21.75246238708496, -21.274078369140625, -20.79569435119629, -20.317310333251953, -19.838924407958984, -19.36054039001465, -18.882156372070312, -18.403772354125977, -17.92538833618164, -17.447004318237305, -16.96862030029297, -16.490234375, -16.011850357055664, -15.533466339111328, -15.055082321166992, -14.576698303222656, -14.09831428527832, -13.619930267333984, -13.141545295715332, -12.663161277770996, -12.18477725982666, -11.706392288208008, -11.228008270263672, -10.749624252319336, -10.271240234375, -9.792856216430664, -9.314471244812012, -8.836087226867676, -8.35770320892334, -7.879318714141846, -7.400934219360352, -6.922549247741699, -6.444165229797363, -5.965780735015869, -5.487396240234375, -5.009012222290039, -4.530628204345703, -4.052243709564209, -3.573859453201294, -3.095475196838379, -2.617090940475464, -2.138706684112549, -1.6603224277496338, -1.1819381713867188, -0.7035539150238037, -0.22516965866088867, 0.25321459770202637, 0.7315988540649414, 1.2099831104278564, 1.6883673667907715, 2.1667516231536865, 2.6451358795166016, 3.1235201358795166, 3.6019043922424316, 4.080288887023926, 4.558672904968262, 5.037056922912598, 5.515441417694092, 5.993825912475586, 6.472209930419922, 6.950593948364258, 7.428978443145752, 7.907362937927246, 8.385746955871582]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 12.0, 11.0, 14.0, 15.0, 21.0, 18.0, 21.0, 31.0, 39.0, 38.0, 31.0, 52.0, 145.0, 142.0, 66.0, 45.0, 39.0, 22.0, 31.0, 27.0, 28.0, 21.0, 16.0, 8.0, 9.0, 11.0, 10.0, 13.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.262158393859863, -12.884936332702637, -12.50771427154541, -12.130491256713867, -11.75326919555664, -11.376047134399414, -10.998825073242188, -10.621603012084961, -10.244380950927734, -9.867158889770508, -9.489936828613281, -9.112714767456055, -8.735491752624512, -8.358269691467285, -7.981047630310059, -7.603825569152832, -7.226602554321289, -6.8493804931640625, -6.472157955169678, -6.094935894012451, -5.717713356018066, -5.34049129486084, -4.963269233703613, -4.586047172546387, -4.208824634552002, -3.8316023349761963, -3.4543800354003906, -3.077157974243164, -2.6999356746673584, -2.3227133750915527, -1.9454913139343262, -1.5682690143585205, -1.1910476684570312, -0.8138254284858704, -0.4366031885147095, -0.05938100814819336, 0.3178412914276123, 0.695063591003418, 1.0722856521606445, 1.4495079517364502, 1.8267302513122559, 2.2039525508880615, 2.581174850463867, 2.9583969116210938, 3.3356192111968994, 3.712841510772705, 4.090063571929932, 4.467286109924316, 4.844508171081543, 5.2217302322387695, 5.598952770233154, 5.976174831390381, 6.353397369384766, 6.730619430541992, 7.107841491699219, 7.485063552856445, 7.86228609085083, 8.239508628845215, 8.616730690002441, 8.993952751159668, 9.371174812316895, 9.748397827148438, 10.125619888305664, 10.50284194946289, 10.880064010620117]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 11.0, 12.0, 11.0, 25.0, 38.0, 77.0, 108.0, 182.0, 287.0, 615.0, 1106.0, 2196.0, 5468.0, 18216.0, 92787.0, 529604.0, 1851096.0, 1328823.0, 291840.0, 51548.0, 12515.0, 3966.0, 1652.0, 957.0, 455.0, 285.0, 170.0, 86.0, 54.0, 34.0, 27.0, 7.0, 10.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.83453369140625, -0.7979736328125, -0.76141357421875, -0.724853515625, -0.68829345703125, -0.6517333984375, -0.61517333984375, -0.57861328125, -0.54205322265625, -0.5054931640625, -0.46893310546875, -0.432373046875, -0.39581298828125, -0.3592529296875, -0.32269287109375, -0.2861328125, -0.24957275390625, -0.2130126953125, -0.17645263671875, -0.139892578125, -0.10333251953125, -0.0667724609375, -0.03021240234375, 0.00634765625, 0.04290771484375, 0.0794677734375, 0.11602783203125, 0.152587890625, 0.18914794921875, 0.2257080078125, 0.26226806640625, 0.298828125, 0.33538818359375, 0.3719482421875, 0.40850830078125, 0.445068359375, 0.48162841796875, 0.5181884765625, 0.55474853515625, 0.59130859375, 0.62786865234375, 0.6644287109375, 0.70098876953125, 0.737548828125, 0.77410888671875, 0.8106689453125, 0.84722900390625, 0.8837890625, 0.92034912109375, 0.9569091796875, 0.99346923828125, 1.030029296875, 1.06658935546875, 1.1031494140625, 1.13970947265625, 1.17626953125, 1.21282958984375, 1.2493896484375, 1.28594970703125, 1.322509765625, 1.35906982421875, 1.3956298828125, 1.43218994140625, 1.46875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 12.0, 27.0, 22.0, 26.0, 25.0, 26.0, 38.0, 36.0, 55.0, 39.0, 43.0, 40.0, 50.0, 75.0, 57.0, 48.0, 54.0, 41.0, 29.0, 44.0, 41.0, 29.0, 23.0, 19.0, 13.0, 9.0, 15.0, 7.0, 4.0, 10.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9443359375, -0.9166183471679688, -0.8889007568359375, -0.8611831665039062, -0.833465576171875, -0.8057479858398438, -0.7780303955078125, -0.7503128051757812, -0.72259521484375, -0.6948776245117188, -0.6671600341796875, -0.6394424438476562, -0.611724853515625, -0.5840072631835938, -0.5562896728515625, -0.5285720825195312, -0.5008544921875, -0.47313690185546875, -0.4454193115234375, -0.41770172119140625, -0.389984130859375, -0.36226654052734375, -0.3345489501953125, -0.30683135986328125, -0.27911376953125, -0.25139617919921875, -0.2236785888671875, -0.19596099853515625, -0.168243408203125, -0.14052581787109375, -0.1128082275390625, -0.08509063720703125, -0.057373046875, -0.02965545654296875, -0.0019378662109375, 0.02577972412109375, 0.053497314453125, 0.08121490478515625, 0.1089324951171875, 0.13665008544921875, 0.16436767578125, 0.19208526611328125, 0.2198028564453125, 0.24752044677734375, 0.275238037109375, 0.30295562744140625, 0.3306732177734375, 0.35839080810546875, 0.3861083984375, 0.41382598876953125, 0.4415435791015625, 0.46926116943359375, 0.496978759765625, 0.5246963500976562, 0.5524139404296875, 0.5801315307617188, 0.60784912109375, 0.6355667114257812, 0.6632843017578125, 0.6910018920898438, 0.718719482421875, 0.7464370727539062, 0.7741546630859375, 0.8018722534179688, 0.82958984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 9.0, 14.0, 18.0, 22.0, 38.0, 48.0, 76.0, 130.0, 200.0, 394.0, 743.0, 1641.0, 4814.0, 33327.0, 3487256.0, 643389.0, 15830.0, 3496.0, 1349.0, 605.0, 347.0, 187.0, 108.0, 73.0, 52.0, 24.0, 15.0, 24.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.87628173828125, -3.7545166015625, -3.63275146484375, -3.510986328125, -3.38922119140625, -3.2674560546875, -3.14569091796875, -3.02392578125, -2.90216064453125, -2.7803955078125, -2.65863037109375, -2.536865234375, -2.41510009765625, -2.2933349609375, -2.17156982421875, -2.0498046875, -1.92803955078125, -1.8062744140625, -1.68450927734375, -1.562744140625, -1.44097900390625, -1.3192138671875, -1.19744873046875, -1.07568359375, -0.95391845703125, -0.8321533203125, -0.71038818359375, -0.588623046875, -0.46685791015625, -0.3450927734375, -0.22332763671875, -0.1015625, 0.02020263671875, 0.1419677734375, 0.26373291015625, 0.385498046875, 0.50726318359375, 0.6290283203125, 0.75079345703125, 0.87255859375, 0.99432373046875, 1.1160888671875, 1.23785400390625, 1.359619140625, 1.48138427734375, 1.6031494140625, 1.72491455078125, 1.8466796875, 1.96844482421875, 2.0902099609375, 2.21197509765625, 2.333740234375, 2.45550537109375, 2.5772705078125, 2.69903564453125, 2.82080078125, 2.94256591796875, 3.0643310546875, 3.18609619140625, 3.307861328125, 3.42962646484375, 3.5513916015625, 3.67315673828125, 3.794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 5.0, 16.0, 14.0, 21.0, 36.0, 46.0, 73.0, 108.0, 146.0, 208.0, 328.0, 430.0, 545.0, 509.0, 400.0, 319.0, 225.0, 166.0, 124.0, 92.0, 55.0, 50.0, 29.0, 24.0, 25.0, 15.0, 14.0, 3.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.03125, -1.958160400390625, -1.88507080078125, -1.811981201171875, -1.7388916015625, -1.665802001953125, -1.59271240234375, -1.519622802734375, -1.446533203125, -1.373443603515625, -1.30035400390625, -1.227264404296875, -1.1541748046875, -1.081085205078125, -1.00799560546875, -0.934906005859375, -0.86181640625, -0.788726806640625, -0.71563720703125, -0.642547607421875, -0.5694580078125, -0.496368408203125, -0.42327880859375, -0.350189208984375, -0.277099609375, -0.204010009765625, -0.13092041015625, -0.057830810546875, 0.0152587890625, 0.088348388671875, 0.16143798828125, 0.234527587890625, 0.3076171875, 0.380706787109375, 0.45379638671875, 0.526885986328125, 0.5999755859375, 0.673065185546875, 0.74615478515625, 0.819244384765625, 0.892333984375, 0.965423583984375, 1.03851318359375, 1.111602783203125, 1.1846923828125, 1.257781982421875, 1.33087158203125, 1.403961181640625, 1.47705078125, 1.550140380859375, 1.62322998046875, 1.696319580078125, 1.7694091796875, 1.842498779296875, 1.91558837890625, 1.988677978515625, 2.061767578125, 2.134857177734375, 2.20794677734375, 2.281036376953125, 2.3541259765625, 2.427215576171875, 2.50030517578125, 2.573394775390625, 2.646484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 8.0, 7.0, 22.0, 36.0, 66.0, 119.0, 232.0, 222.0, 147.0, 55.0, 34.0, 19.0, 12.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.069202423095703, -25.97530174255371, -24.88140106201172, -23.787500381469727, -22.693599700927734, -21.59969711303711, -20.505796432495117, -19.411895751953125, -18.317995071411133, -17.22409439086914, -16.13019371032715, -15.03629207611084, -13.942391395568848, -12.848490715026855, -11.754589080810547, -10.660688400268555, -9.566787719726562, -8.47288703918457, -7.37898588180542, -6.2850847244262695, -5.191184043884277, -4.097283363342285, -3.0033822059631348, -1.9094810485839844, -0.8155803680419922, 0.2783205509185791, 1.3722214698791504, 2.4661223888397217, 3.560023307800293, 4.653923988342285, 5.7478251457214355, 6.841726303100586, 7.935626983642578, 9.02952766418457, 10.123428344726562, 11.217329978942871, 12.311230659484863, 13.405131340026855, 14.499032974243164, 15.592933654785156, 16.68683433532715, 17.78073501586914, 18.874635696411133, 19.968536376953125, 21.06243896484375, 22.15633773803711, 23.250240325927734, 24.344141006469727, 25.43804168701172, 26.53194236755371, 27.625843048095703, 28.719743728637695, 29.813644409179688, 30.907546997070312, 32.00144577026367, 33.0953483581543, 34.189247131347656, 35.28314971923828, 36.37704849243164, 37.470951080322266, 38.564849853515625, 39.65875244140625, 40.75265121459961, 41.846553802490234, 42.94045639038086]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 7.0, 17.0, 17.0, 8.0, 18.0, 25.0, 15.0, 24.0, 21.0, 36.0, 32.0, 40.0, 36.0, 45.0, 42.0, 54.0, 58.0, 61.0, 53.0, 49.0, 39.0, 35.0, 27.0, 23.0, 36.0, 24.0, 29.0, 15.0, 13.0, 18.0, 12.0, 17.0, 4.0, 7.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.017311096191406, -14.561007499694824, -14.104703903198242, -13.648401260375977, -13.192097663879395, -12.735794067382812, -12.27949047088623, -11.823186874389648, -11.366883277893066, -10.910579681396484, -10.454276084899902, -9.99797248840332, -9.541669845581055, -9.085366249084473, -8.62906265258789, -8.172759056091309, -7.716455936431885, -7.260152339935303, -6.803849220275879, -6.347545623779297, -5.891242027282715, -5.434938430786133, -4.978635311126709, -4.522331714630127, -4.066028594970703, -3.6097252368927, -3.153421640396118, -2.6971182823181152, -2.240814685821533, -1.7845113277435303, -1.3282079696655273, -0.8719043731689453, -0.4156007766723633, 0.04070267081260681, 0.4970061182975769, 0.9533095359802246, 1.409613013267517, 1.8659164905548096, 2.3222198486328125, 2.7785234451293945, 3.2348268032073975, 3.6911301612854004, 4.147433757781982, 4.603736877441406, 5.060040473937988, 5.51634407043457, 5.972647666931152, 6.428951263427734, 6.885254383087158, 7.34155797958374, 7.797861099243164, 8.254164695739746, 8.710468292236328, 9.16677188873291, 9.623075485229492, 10.079378128051758, 10.53568172454834, 10.991985321044922, 11.448288917541504, 11.904592514038086, 12.360895156860352, 12.817198753356934, 13.273502349853516, 13.729805946350098, 14.18610954284668]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 11.0, 16.0, 11.0, 36.0, 49.0, 68.0, 110.0, 177.0, 266.0, 442.0, 849.0, 1585.0, 3361.0, 7566.0, 20300.0, 65552.0, 288216.0, 511094.0, 100767.0, 28941.0, 10323.0, 4307.0, 1975.0, 1088.0, 530.0, 327.0, 195.0, 124.0, 78.0, 40.0, 35.0, 19.0, 22.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.47198486328125, -1.4215087890625, -1.37103271484375, -1.320556640625, -1.27008056640625, -1.2196044921875, -1.16912841796875, -1.11865234375, -1.06817626953125, -1.0177001953125, -0.96722412109375, -0.916748046875, -0.86627197265625, -0.8157958984375, -0.76531982421875, -0.71484375, -0.66436767578125, -0.6138916015625, -0.56341552734375, -0.512939453125, -0.46246337890625, -0.4119873046875, -0.36151123046875, -0.31103515625, -0.26055908203125, -0.2100830078125, -0.15960693359375, -0.109130859375, -0.05865478515625, -0.0081787109375, 0.04229736328125, 0.0927734375, 0.14324951171875, 0.1937255859375, 0.24420166015625, 0.294677734375, 0.34515380859375, 0.3956298828125, 0.44610595703125, 0.49658203125, 0.54705810546875, 0.5975341796875, 0.64801025390625, 0.698486328125, 0.74896240234375, 0.7994384765625, 0.84991455078125, 0.900390625, 0.95086669921875, 1.0013427734375, 1.05181884765625, 1.102294921875, 1.15277099609375, 1.2032470703125, 1.25372314453125, 1.30419921875, 1.35467529296875, 1.4051513671875, 1.45562744140625, 1.506103515625, 1.55657958984375, 1.6070556640625, 1.65753173828125, 1.7080078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 17.0, 11.0, 33.0, 32.0, 36.0, 41.0, 47.0, 52.0, 65.0, 56.0, 71.0, 74.0, 70.0, 64.0, 74.0, 49.0, 36.0, 37.0, 17.0, 27.0, 16.0, 9.0, 13.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2172393798828125, -1.173736572265625, -1.1302337646484375, -1.08673095703125, -1.0432281494140625, -0.999725341796875, -0.9562225341796875, -0.9127197265625, -0.8692169189453125, -0.825714111328125, -0.7822113037109375, -0.73870849609375, -0.6952056884765625, -0.651702880859375, -0.6082000732421875, -0.564697265625, -0.5211944580078125, -0.477691650390625, -0.4341888427734375, -0.39068603515625, -0.3471832275390625, -0.303680419921875, -0.2601776123046875, -0.2166748046875, -0.1731719970703125, -0.129669189453125, -0.0861663818359375, -0.04266357421875, 0.0008392333984375, 0.044342041015625, 0.0878448486328125, 0.13134765625, 0.1748504638671875, 0.218353271484375, 0.2618560791015625, 0.30535888671875, 0.3488616943359375, 0.392364501953125, 0.4358673095703125, 0.4793701171875, 0.5228729248046875, 0.566375732421875, 0.6098785400390625, 0.65338134765625, 0.6968841552734375, 0.740386962890625, 0.7838897705078125, 0.827392578125, 0.8708953857421875, 0.914398193359375, 0.9579010009765625, 1.00140380859375, 1.0449066162109375, 1.088409423828125, 1.1319122314453125, 1.1754150390625, 1.2189178466796875, 1.262420654296875, 1.3059234619140625, 1.34942626953125, 1.3929290771484375, 1.436431884765625, 1.4799346923828125, 1.5234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 16.0, 25.0, 22.0, 37.0, 48.0, 68.0, 118.0, 199.0, 320.0, 615.0, 1335.0, 4374.0, 30102.0, 887942.0, 110053.0, 9457.0, 2136.0, 745.0, 414.0, 231.0, 91.0, 73.0, 35.0, 28.0, 22.0, 16.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.383514404296875, -2.29437255859375, -2.205230712890625, -2.1160888671875, -2.026947021484375, -1.93780517578125, -1.848663330078125, -1.759521484375, -1.670379638671875, -1.58123779296875, -1.492095947265625, -1.4029541015625, -1.313812255859375, -1.22467041015625, -1.135528564453125, -1.04638671875, -0.957244873046875, -0.86810302734375, -0.778961181640625, -0.6898193359375, -0.600677490234375, -0.51153564453125, -0.422393798828125, -0.333251953125, -0.244110107421875, -0.15496826171875, -0.065826416015625, 0.0233154296875, 0.112457275390625, 0.20159912109375, 0.290740966796875, 0.3798828125, 0.469024658203125, 0.55816650390625, 0.647308349609375, 0.7364501953125, 0.825592041015625, 0.91473388671875, 1.003875732421875, 1.093017578125, 1.182159423828125, 1.27130126953125, 1.360443115234375, 1.4495849609375, 1.538726806640625, 1.62786865234375, 1.717010498046875, 1.80615234375, 1.895294189453125, 1.98443603515625, 2.073577880859375, 2.1627197265625, 2.251861572265625, 2.34100341796875, 2.430145263671875, 2.519287109375, 2.608428955078125, 2.69757080078125, 2.786712646484375, 2.8758544921875, 2.964996337890625, 3.05413818359375, 3.143280029296875, 3.232421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 10.0, 5.0, 13.0, 14.0, 21.0, 22.0, 16.0, 19.0, 27.0, 21.0, 34.0, 40.0, 44.0, 40.0, 65.0, 89.0, 69.0, 73.0, 73.0, 51.0, 49.0, 33.0, 25.0, 23.0, 22.0, 18.0, 22.0, 12.0, 9.0, 4.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.252410888671875, -4.12591552734375, -3.999420166015625, -3.8729248046875, -3.746429443359375, -3.61993408203125, -3.493438720703125, -3.366943359375, -3.240447998046875, -3.11395263671875, -2.987457275390625, -2.8609619140625, -2.734466552734375, -2.60797119140625, -2.481475830078125, -2.35498046875, -2.228485107421875, -2.10198974609375, -1.975494384765625, -1.8489990234375, -1.722503662109375, -1.59600830078125, -1.469512939453125, -1.343017578125, -1.216522216796875, -1.09002685546875, -0.963531494140625, -0.8370361328125, -0.710540771484375, -0.58404541015625, -0.457550048828125, -0.3310546875, -0.204559326171875, -0.07806396484375, 0.048431396484375, 0.1749267578125, 0.301422119140625, 0.42791748046875, 0.554412841796875, 0.680908203125, 0.807403564453125, 0.93389892578125, 1.060394287109375, 1.1868896484375, 1.313385009765625, 1.43988037109375, 1.566375732421875, 1.69287109375, 1.819366455078125, 1.94586181640625, 2.072357177734375, 2.1988525390625, 2.325347900390625, 2.45184326171875, 2.578338623046875, 2.704833984375, 2.831329345703125, 2.95782470703125, 3.084320068359375, 3.2108154296875, 3.337310791015625, 3.46380615234375, 3.590301513671875, 3.716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 19.0, 29.0, 38.0, 71.0, 140.0, 292.0, 562.0, 1562.0, 5998.0, 37034.0, 911672.0, 77768.0, 9427.0, 2391.0, 736.0, 328.0, 168.0, 91.0, 62.0, 39.0, 13.0, 10.0, 7.0, 13.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.67333984375, -0.6533279418945312, -0.6333160400390625, -0.6133041381835938, -0.593292236328125, -0.5732803344726562, -0.5532684326171875, -0.5332565307617188, -0.51324462890625, -0.49323272705078125, -0.4732208251953125, -0.45320892333984375, -0.433197021484375, -0.41318511962890625, -0.3931732177734375, -0.37316131591796875, -0.3531494140625, -0.33313751220703125, -0.3131256103515625, -0.29311370849609375, -0.273101806640625, -0.25308990478515625, -0.2330780029296875, -0.21306610107421875, -0.19305419921875, -0.17304229736328125, -0.1530303955078125, -0.13301849365234375, -0.113006591796875, -0.09299468994140625, -0.0729827880859375, -0.05297088623046875, -0.032958984375, -0.01294708251953125, 0.0070648193359375, 0.02707672119140625, 0.047088623046875, 0.06710052490234375, 0.0871124267578125, 0.10712432861328125, 0.12713623046875, 0.14714813232421875, 0.1671600341796875, 0.18717193603515625, 0.207183837890625, 0.22719573974609375, 0.2472076416015625, 0.26721954345703125, 0.2872314453125, 0.30724334716796875, 0.3272552490234375, 0.34726715087890625, 0.367279052734375, 0.38729095458984375, 0.4073028564453125, 0.42731475830078125, 0.44732666015625, 0.46733856201171875, 0.4873504638671875, 0.5073623657226562, 0.527374267578125, 0.5473861694335938, 0.5673980712890625, 0.5874099731445312, 0.607421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 5.0, 11.0, 13.0, 7.0, 14.0, 12.0, 20.0, 31.0, 28.0, 53.0, 87.0, 88.0, 100.0, 101.0, 103.0, 70.0, 39.0, 37.0, 23.0, 22.0, 20.0, 19.0, 8.0, 11.0, 8.0, 7.0, 6.0, 4.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011773966252803802, -0.00011364743113517761, -0.0001095551997423172, -0.00010546296834945679, -0.00010137073695659637, -9.727850556373596e-05, -9.318627417087555e-05, -8.909404277801514e-05, -8.500181138515472e-05, -8.090957999229431e-05, -7.68173485994339e-05, -7.272511720657349e-05, -6.863288581371307e-05, -6.454065442085266e-05, -6.044842302799225e-05, -5.6356191635131836e-05, -5.226396024227142e-05, -4.817172884941101e-05, -4.40794974565506e-05, -3.9987266063690186e-05, -3.589503467082977e-05, -3.180280327796936e-05, -2.7710571885108948e-05, -2.3618340492248535e-05, -1.9526109099388123e-05, -1.543387770652771e-05, -1.1341646313667297e-05, -7.249414920806885e-06, -3.157183527946472e-06, 9.350478649139404e-07, 5.027279257774353e-06, 9.119510650634766e-06, 1.3211742043495178e-05, 1.730397343635559e-05, 2.1396204829216003e-05, 2.5488436222076416e-05, 2.958066761493683e-05, 3.367289900779724e-05, 3.7765130400657654e-05, 4.1857361793518066e-05, 4.594959318637848e-05, 5.004182457923889e-05, 5.4134055972099304e-05, 5.822628736495972e-05, 6.231851875782013e-05, 6.641075015068054e-05, 7.050298154354095e-05, 7.459521293640137e-05, 7.868744432926178e-05, 8.277967572212219e-05, 8.68719071149826e-05, 9.096413850784302e-05, 9.505636990070343e-05, 9.914860129356384e-05, 0.00010324083268642426, 0.00010733306407928467, 0.00011142529547214508, 0.00011551752686500549, 0.0001196097582578659, 0.00012370198965072632, 0.00012779422104358673, 0.00013188645243644714, 0.00013597868382930756, 0.00014007091522216797]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 16.0, 14.0, 33.0, 46.0, 80.0, 150.0, 264.0, 533.0, 1228.0, 3337.0, 12206.0, 72257.0, 874306.0, 66706.0, 11647.0, 3323.0, 1288.0, 488.0, 245.0, 146.0, 99.0, 48.0, 23.0, 9.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397216796875, -0.384185791015625, -0.37115478515625, -0.358123779296875, -0.3450927734375, -0.332061767578125, -0.31903076171875, -0.305999755859375, -0.29296875, -0.279937744140625, -0.26690673828125, -0.253875732421875, -0.2408447265625, -0.227813720703125, -0.21478271484375, -0.201751708984375, -0.188720703125, -0.175689697265625, -0.16265869140625, -0.149627685546875, -0.1365966796875, -0.123565673828125, -0.11053466796875, -0.097503662109375, -0.08447265625, -0.071441650390625, -0.05841064453125, -0.045379638671875, -0.0323486328125, -0.019317626953125, -0.00628662109375, 0.006744384765625, 0.019775390625, 0.032806396484375, 0.04583740234375, 0.058868408203125, 0.0718994140625, 0.084930419921875, 0.09796142578125, 0.110992431640625, 0.1240234375, 0.137054443359375, 0.15008544921875, 0.163116455078125, 0.1761474609375, 0.189178466796875, 0.20220947265625, 0.215240478515625, 0.228271484375, 0.241302490234375, 0.25433349609375, 0.267364501953125, 0.2803955078125, 0.293426513671875, 0.30645751953125, 0.319488525390625, 0.33251953125, 0.345550537109375, 0.35858154296875, 0.371612548828125, 0.3846435546875, 0.397674560546875, 0.41070556640625, 0.423736572265625, 0.436767578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 15.0, 20.0, 20.0, 37.0, 38.0, 59.0, 62.0, 74.0, 114.0, 107.0, 85.0, 72.0, 62.0, 38.0, 34.0, 23.0, 19.0, 15.0, 13.0, 12.0, 5.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.36083984375, -0.3484230041503906, -0.33600616455078125, -0.3235893249511719, -0.3111724853515625, -0.2987556457519531, -0.28633880615234375, -0.2739219665527344, -0.261505126953125, -0.24908828735351562, -0.23667144775390625, -0.22425460815429688, -0.2118377685546875, -0.19942092895507812, -0.18700408935546875, -0.17458724975585938, -0.16217041015625, -0.14975357055664062, -0.13733673095703125, -0.12491989135742188, -0.1125030517578125, -0.10008621215820312, -0.08766937255859375, -0.07525253295898438, -0.062835693359375, -0.050418853759765625, -0.03800201416015625, -0.025585174560546875, -0.0131683349609375, -0.000751495361328125, 0.01166534423828125, 0.024082183837890625, 0.0364990234375, 0.048915863037109375, 0.06133270263671875, 0.07374954223632812, 0.0861663818359375, 0.09858322143554688, 0.11100006103515625, 0.12341690063476562, 0.135833740234375, 0.14825057983398438, 0.16066741943359375, 0.17308425903320312, 0.1855010986328125, 0.19791793823242188, 0.21033477783203125, 0.22275161743164062, 0.23516845703125, 0.24758529663085938, 0.26000213623046875, 0.2724189758300781, 0.2848358154296875, 0.2972526550292969, 0.30966949462890625, 0.3220863342285156, 0.334503173828125, 0.3469200134277344, 0.35933685302734375, 0.3717536926269531, 0.3841705322265625, 0.3965873718261719, 0.40900421142578125, 0.4214210510253906, 0.433837890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 5.0, 37.0, 78.0, 378.0, 415.0, 71.0, 14.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.805763244628906, -48.72344970703125, -47.64113235473633, -46.55881881713867, -45.47650146484375, -44.394187927246094, -43.31187057495117, -42.229557037353516, -41.147239685058594, -40.06492614746094, -38.982608795166016, -37.90029525756836, -36.81797790527344, -35.73566436767578, -34.65334701538086, -33.5710334777832, -32.48871612548828, -31.406400680541992, -30.324085235595703, -29.241769790649414, -28.159454345703125, -27.077138900756836, -25.994823455810547, -24.91250991821289, -23.830196380615234, -22.747880935668945, -21.665565490722656, -20.583250045776367, -19.500934600830078, -18.41861915588379, -17.3363037109375, -16.253990173339844, -15.171670913696289, -14.08935546875, -13.007040023803711, -11.924724578857422, -10.842409133911133, -9.760093688964844, -8.677779197692871, -7.595463752746582, -6.513148307800293, -5.430832862854004, -4.348517417907715, -3.266202449798584, -2.183887004852295, -1.1015715599060059, -0.019256591796875, 1.063058853149414, 2.145374298095703, 3.227689743041992, 4.310005187988281, 5.392320156097412, 6.474635601043701, 7.55695104598999, 8.639266014099121, 9.72158145904541, 10.8038969039917, 11.886212348937988, 12.968527793884277, 14.05084228515625, 15.133157730102539, 16.215473175048828, 17.297788619995117, 18.380104064941406, 19.462419509887695]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 7.0, 7.0, 8.0, 6.0, 3.0, 15.0, 18.0, 20.0, 12.0, 15.0, 12.0, 17.0, 18.0, 19.0, 17.0, 25.0, 33.0, 126.0, 207.0, 133.0, 37.0, 23.0, 31.0, 24.0, 14.0, 20.0, 10.0, 16.0, 15.0, 13.0, 5.0, 9.0, 6.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.094806671142578, -8.814618110656738, -8.534429550170898, -8.254241943359375, -7.974053382873535, -7.693864822387695, -7.4136762619018555, -7.133487701416016, -6.853299617767334, -6.573111057281494, -6.2929229736328125, -6.012734413146973, -5.732545852661133, -5.452357769012451, -5.172169208526611, -4.89198112487793, -4.61179256439209, -4.33160400390625, -4.051415920257568, -3.7712273597717285, -3.4910390377044678, -3.210850715637207, -2.930662155151367, -2.6504738330841064, -2.3702855110168457, -2.090097188949585, -1.8099087476730347, -1.5297203063964844, -1.2495319843292236, -0.9693436622619629, -0.6891552209854126, -0.4089667797088623, -0.12877845764160156, 0.15140992403030396, 0.4315983057022095, 0.711786687374115, 0.9919750690460205, 1.2721633911132812, 1.5523518323898315, 1.8325402736663818, 2.1127285957336426, 2.3929169178009033, 2.673105239868164, 2.953293800354004, 3.2334821224212646, 3.5136704444885254, 3.7938590049743652, 4.074047088623047, 4.354235649108887, 4.634424209594727, 4.914612293243408, 5.194800853729248, 5.47498893737793, 5.7551774978637695, 6.035366058349609, 6.315554618835449, 6.595742702484131, 6.875931262969971, 7.156119346618652, 7.436307907104492, 7.716496467590332, 7.996684551239014, 8.276872634887695, 8.557061195373535, 8.837249755859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 13.0, 13.0, 22.0, 18.0, 17.0, 18.0, 29.0, 26.0, 27.0, 33.0, 41.0, 93.0, 237.0, 140.0, 52.0, 35.0, 36.0, 23.0, 21.0, 16.0, 16.0, 12.0, 9.0, 2.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.87091064453125, -0.8394775390625, -0.80804443359375, -0.776611328125, -0.74517822265625, -0.7137451171875, -0.68231201171875, -0.65087890625, -0.61944580078125, -0.5880126953125, -0.55657958984375, -0.525146484375, -0.49371337890625, -0.4622802734375, -0.43084716796875, -0.3994140625, -0.36798095703125, -0.3365478515625, -0.30511474609375, -0.273681640625, -0.24224853515625, -0.2108154296875, -0.17938232421875, -0.14794921875, -0.11651611328125, -0.0850830078125, -0.05364990234375, -0.022216796875, 0.00921630859375, 0.0406494140625, 0.07208251953125, 0.103515625, 0.13494873046875, 0.1663818359375, 0.19781494140625, 0.229248046875, 0.26068115234375, 0.2921142578125, 0.32354736328125, 0.35498046875, 0.38641357421875, 0.4178466796875, 0.44927978515625, 0.480712890625, 0.51214599609375, 0.5435791015625, 0.57501220703125, 0.6064453125, 0.63787841796875, 0.6693115234375, 0.70074462890625, 0.732177734375, 0.76361083984375, 0.7950439453125, 0.82647705078125, 0.85791015625, 0.88934326171875, 0.9207763671875, 0.95220947265625, 0.983642578125, 1.01507568359375, 1.0465087890625, 1.07794189453125, 1.109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 7.0, 4.0, 7.0, 6.0, 15.0, 19.0, 25.0, 40.0, 97.0, 215.0, 858.0, 7478.0, 8368660.0, 9792.0, 930.0, 224.0, 91.0, 34.0, 24.0, 12.0, 24.0, 8.0, 7.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.864316940307617, -17.375450134277344, -16.88658332824707, -16.397714614868164, -15.90884780883789, -15.419981002807617, -14.931114196777344, -14.44224739074707, -13.95337963104248, -13.464512825012207, -12.975645065307617, -12.486778259277344, -11.99791145324707, -11.50904369354248, -11.020176887512207, -10.531309127807617, -10.042442321777344, -9.55357551574707, -9.06470775604248, -8.575840950012207, -8.086973190307617, -7.598106384277344, -7.10923957824707, -6.620372295379639, -6.131505012512207, -5.642637729644775, -5.153770446777344, -4.66490364074707, -4.176036357879639, -3.687169075012207, -3.1983020305633545, -2.709434986114502, -2.2205677032470703, -1.7317005395889282, -1.2428333759307861, -0.753966212272644, -0.26509904861450195, 0.2237682342529297, 0.7126352787017822, 1.2015023231506348, 1.6903696060180664, 2.179236888885498, 2.6681039333343506, 3.156970977783203, 3.6458382606506348, 4.134705543518066, 4.62357234954834, 5.1124396324157715, 5.601306915283203, 6.090174198150635, 6.579041481018066, 7.06790828704834, 7.5567755699157715, 8.045642852783203, 8.534509658813477, 9.02337646484375, 9.51224422454834, 10.001111030578613, 10.489978790283203, 10.978845596313477, 11.46771240234375, 11.95658016204834, 12.445446968078613, 12.934314727783203, 13.423181533813477]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 8.0, 0.0, 6.0, 7.0, 1.0, 6.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9409661293029785, -5.722023963928223, -5.503082275390625, -5.284140110015869, -5.065197944641113, -4.846256256103516, -4.62731409072876, -4.408371925354004, -4.189430236816406, -3.9704883098602295, -3.7515463829040527, -3.532604217529297, -3.31366229057312, -3.0947203636169434, -2.8757781982421875, -2.6568362712860107, -2.437894344329834, -2.2189524173736572, -2.0000104904174805, -1.7810683250427246, -1.5621263980865479, -1.343184471130371, -1.1242424249649048, -0.9053003787994385, -0.6863584518432617, -0.4674164652824402, -0.24847447872161865, -0.02953249216079712, 0.18940949440002441, 0.40835142135620117, 0.6272934675216675, 0.8462355136871338, 1.0651779174804688, 1.2841198444366455, 1.5030618906021118, 1.7220039367675781, 1.9409458637237549, 2.1598877906799316, 2.3788299560546875, 2.5977718830108643, 2.816713809967041, 3.0356557369232178, 3.2545976638793945, 3.4735398292541504, 3.692481756210327, 3.911423683166504, 4.13036584854126, 4.349308013916016, 4.568249702453613, 4.787191867828369, 5.006133556365967, 5.225075721740723, 5.44401741027832, 5.662959575653076, 5.881901741027832, 6.10084342956543, 6.3197855949401855, 6.538727760314941, 6.757669448852539, 6.976611614227295, 7.195553779602051, 7.414495468139648, 7.633437633514404, 7.85237979888916, 8.071321487426758]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 26.0, 27.0, 44.0, 44.0, 106.0, 131.0, 238.0, 472.0, 1226.0, 4297.0, 17810.0, 85839.0, 269715.0, 111618.0, 23823.0, 5862.0, 1620.0, 602.0, 288.0, 142.0, 90.0, 63.0, 42.0, 50.0, 22.0, 11.0, 12.0, 8.0, 11.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5318603515625, -8.243408203125, -7.9549560546875, -7.66650390625, -7.3780517578125, -7.089599609375, -6.8011474609375, -6.5126953125, -6.2242431640625, -5.935791015625, -5.6473388671875, -5.35888671875, -5.0704345703125, -4.781982421875, -4.4935302734375, -4.205078125, -3.9166259765625, -3.628173828125, -3.3397216796875, -3.05126953125, -2.7628173828125, -2.474365234375, -2.1859130859375, -1.8974609375, -1.6090087890625, -1.320556640625, -1.0321044921875, -0.74365234375, -0.4552001953125, -0.166748046875, 0.1217041015625, 0.41015625, 0.6986083984375, 0.987060546875, 1.2755126953125, 1.56396484375, 1.8524169921875, 2.140869140625, 2.4293212890625, 2.7177734375, 3.0062255859375, 3.294677734375, 3.5831298828125, 3.87158203125, 4.1600341796875, 4.448486328125, 4.7369384765625, 5.025390625, 5.3138427734375, 5.602294921875, 5.8907470703125, 6.17919921875, 6.4676513671875, 6.756103515625, 7.0445556640625, 7.3330078125, 7.6214599609375, 7.909912109375, 8.1983642578125, 8.48681640625, 8.7752685546875, 9.063720703125, 9.3521728515625, 9.640625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 11.0, 19.0, 17.0, 27.0, 25.0, 41.0, 56.0, 62.0, 73.0, 90.0, 89.0, 83.0, 80.0, 75.0, 65.0, 44.0, 35.0, 21.0, 28.0, 17.0, 6.0, 5.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.407073974609375, -1.35906982421875, -1.311065673828125, -1.2630615234375, -1.215057373046875, -1.16705322265625, -1.119049072265625, -1.071044921875, -1.023040771484375, -0.97503662109375, -0.927032470703125, -0.8790283203125, -0.831024169921875, -0.78302001953125, -0.735015869140625, -0.68701171875, -0.639007568359375, -0.59100341796875, -0.542999267578125, -0.4949951171875, -0.446990966796875, -0.39898681640625, -0.350982666015625, -0.302978515625, -0.254974365234375, -0.20697021484375, -0.158966064453125, -0.1109619140625, -0.062957763671875, -0.01495361328125, 0.033050537109375, 0.0810546875, 0.129058837890625, 0.17706298828125, 0.225067138671875, 0.2730712890625, 0.321075439453125, 0.36907958984375, 0.417083740234375, 0.465087890625, 0.513092041015625, 0.56109619140625, 0.609100341796875, 0.6571044921875, 0.705108642578125, 0.75311279296875, 0.801116943359375, 0.84912109375, 0.897125244140625, 0.94512939453125, 0.993133544921875, 1.0411376953125, 1.089141845703125, 1.13714599609375, 1.185150146484375, 1.233154296875, 1.281158447265625, 1.32916259765625, 1.377166748046875, 1.4251708984375, 1.473175048828125, 1.52117919921875, 1.569183349609375, 1.6171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 9.0, 17.0, 99.0, 217.0, 88.0, 22.0, 11.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.651233673095703, -11.055516242980957, -10.459798812866211, -9.864081382751465, -9.268363952636719, -8.672646522521973, -8.076929092407227, -7.481212139129639, -6.885494709014893, -6.2897772789001465, -5.6940598487854, -5.0983428955078125, -4.502625465393066, -3.906907796859741, -3.311190605163574, -2.715473175048828, -2.119755744934082, -1.524038314819336, -0.9283210039138794, -0.33260369300842285, 0.26311373710632324, 0.8588311672210693, 1.4545483589172363, 2.0502657890319824, 2.6459832191467285, 3.2417006492614746, 3.8374180793762207, 4.433135032653809, 5.028852462768555, 5.624569892883301, 6.220287322998047, 6.816004753112793, 7.411722183227539, 8.007439613342285, 8.603157043457031, 9.198874473571777, 9.794591903686523, 10.39030933380127, 10.986026763916016, 11.581743240356445, 12.177461624145508, 12.773179054260254, 13.368896484375, 13.964613914489746, 14.560331344604492, 15.156048774719238, 15.751766204833984, 16.347482681274414, 16.943199157714844, 17.538915634155273, 18.134634017944336, 18.730350494384766, 19.326068878173828, 19.921785354614258, 20.51750373840332, 21.11322021484375, 21.708938598632812, 22.304655075073242, 22.900373458862305, 23.496089935302734, 24.091808319091797, 24.687524795532227, 25.28324317932129, 25.87895965576172, 26.47467803955078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 5.0, 6.0, 9.0, 16.0, 29.0, 86.0, 130.0, 89.0, 36.0, 13.0, 12.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.590359687805176, -8.335735321044922, -8.081110954284668, -7.826486587524414, -7.57186222076416, -7.317237854003906, -7.062613487243652, -6.807989120483398, -6.5533647537231445, -6.298740386962891, -6.044116020202637, -5.789491653442383, -5.534867286682129, -5.280242919921875, -5.025618553161621, -4.770994186401367, -4.516369819641113, -4.261745452880859, -4.0071210861206055, -3.7524967193603516, -3.4978723526000977, -3.2432479858398438, -2.98862361907959, -2.733999252319336, -2.479374885559082, -2.224750518798828, -1.9701261520385742, -1.7155017852783203, -1.4608774185180664, -1.2062530517578125, -0.9516286849975586, -0.6970043182373047, -0.4423809051513672, -0.18775653839111328, 0.06686782836914062, 0.32149219512939453, 0.5761165618896484, 0.8307409286499023, 1.0853652954101562, 1.3399896621704102, 1.594614028930664, 1.849238395690918, 2.103862762451172, 2.358487129211426, 2.6131114959716797, 2.8677358627319336, 3.1223602294921875, 3.3769845962524414, 3.6316089630126953, 3.886233329772949, 4.140857696533203, 4.395482063293457, 4.650106430053711, 4.904730796813965, 5.159355163574219, 5.413979530334473, 5.668603897094727, 5.9232282638549805, 6.177852630615234, 6.432476997375488, 6.687101364135742, 6.941725730895996, 7.19635009765625, 7.450974464416504, 7.705598831176758]}, "eval/loss": 4.188705921173096, "eval/wer": 2.4265370884569615, "eval/runtime": 1107.9648, "eval/samples_per_second": 2.385, "eval/steps_per_second": 0.299, "train/train_runtime": 8514.9113, "train/train_samples_per_second": 3.352, "train/train_steps_per_second": 0.21, "train/total_flos": 0.0, "train/train_loss": 4.24715919291492} \ No newline at end of file +{"train/loss": 3.5579, "train/learning_rate": 9.345794392523364e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 9916, "_timestamp": 1646108188, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 20.0, 421.0, 554.0, 21.0, 0.0, 0.0, 2.0, 1.0], "bins": [-573.1256713867188, -563.2627563476562, -553.3998413085938, -543.5369873046875, -533.674072265625, -523.8111572265625, -513.9482421875, -504.0853271484375, -494.2224426269531, -484.3595275878906, -474.49664306640625, -464.63372802734375, -454.77081298828125, -444.9079284667969, -435.0450134277344, -425.18212890625, -415.3192138671875, -405.456298828125, -395.5934143066406, -385.7304992675781, -375.8675842285156, -366.00469970703125, -356.14178466796875, -346.27886962890625, -336.41595458984375, -326.55303955078125, -316.6901550292969, -306.8272399902344, -296.9643249511719, -287.1014404296875, -277.238525390625, -267.3756103515625, -257.5126953125, -247.64979553222656, -237.78688049316406, -227.92398071289062, -218.0610809326172, -208.19818115234375, -198.33526611328125, -188.4723663330078, -178.60946655273438, -168.74656677246094, -158.88365173339844, -149.020751953125, -139.15785217285156, -129.29495239257812, -119.43203735351562, -109.56913757324219, -99.70622253417969, -89.84331512451172, -79.98041534423828, -70.11750793457031, -60.25460433959961, -50.391700744628906, -40.52879333496094, -30.6658935546875, -20.802989959716797, -10.940085411071777, -1.0771808624267578, 8.785724639892578, 18.64862823486328, 28.511531829833984, 38.37443923950195, 48.23733901977539, 58.10024642944336]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 2.0, 8.0, 9.0, 14.0, 11.0, 17.0, 21.0, 24.0, 25.0, 30.0, 26.0, 39.0, 40.0, 38.0, 43.0, 54.0, 42.0, 45.0, 42.0, 57.0, 37.0, 38.0, 45.0, 41.0, 37.0, 26.0, 28.0, 32.0, 21.0, 10.0, 17.0, 23.0, 9.0, 12.0, 10.0, 4.0, 11.0, 5.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.35408020019531, -78.11407470703125, -75.87406921386719, -73.63406372070312, -71.39405822753906, -69.154052734375, -66.91404724121094, -64.67404174804688, -62.43403625488281, -60.19403076171875, -57.95402526855469, -55.714019775390625, -53.47401428222656, -51.2340087890625, -48.99400329589844, -46.753997802734375, -44.51398849487305, -42.273983001708984, -40.03397750854492, -37.79397201538086, -35.5539665222168, -33.313961029052734, -31.07395362854004, -28.833948135375977, -26.593942642211914, -24.35393714904785, -22.11393165588379, -19.873924255371094, -17.63391876220703, -15.393914222717285, -13.153907775878906, -10.913902282714844, -8.673896789550781, -6.433891296386719, -4.193885326385498, -1.9538793563842773, 0.28612613677978516, 2.5261316299438477, 4.766138076782227, 7.006143569946289, 9.246149063110352, 11.486154556274414, 13.726160049438477, 15.966166496276855, 18.206172943115234, 20.446178436279297, 22.68618392944336, 24.926189422607422, 27.166194915771484, 29.406200408935547, 31.64620590209961, 33.88621139526367, 36.126216888427734, 38.3662223815918, 40.606231689453125, 42.84623718261719, 45.08624267578125, 47.32624816894531, 49.566253662109375, 51.80625915527344, 54.0462646484375, 56.28627014160156, 58.526275634765625, 60.76628112792969, 63.00628662109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 13.0, 20.0, 22.0, 27.0, 30.0, 48.0, 41.0, 58.0, 54.0, 51.0, 62.0, 54.0, 71.0, 57.0, 61.0, 53.0, 49.0, 38.0, 36.0, 40.0, 24.0, 21.0, 15.0, 14.0, 13.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.7642822265625, -6.602783203125, -6.4412841796875, -6.27978515625, -6.1182861328125, -5.956787109375, -5.7952880859375, -5.6337890625, -5.4722900390625, -5.310791015625, -5.1492919921875, -4.98779296875, -4.8262939453125, -4.664794921875, -4.5032958984375, -4.341796875, -4.1802978515625, -4.018798828125, -3.8572998046875, -3.69580078125, -3.5343017578125, -3.372802734375, -3.2113037109375, -3.0498046875, -2.8883056640625, -2.726806640625, -2.5653076171875, -2.40380859375, -2.2423095703125, -2.080810546875, -1.9193115234375, -1.7578125, -1.5963134765625, -1.434814453125, -1.2733154296875, -1.11181640625, -0.9503173828125, -0.788818359375, -0.6273193359375, -0.4658203125, -0.3043212890625, -0.142822265625, 0.0186767578125, 0.18017578125, 0.3416748046875, 0.503173828125, 0.6646728515625, 0.826171875, 0.9876708984375, 1.149169921875, 1.3106689453125, 1.47216796875, 1.6336669921875, 1.795166015625, 1.9566650390625, 2.1181640625, 2.2796630859375, 2.441162109375, 2.6026611328125, 2.76416015625, 2.9256591796875, 3.087158203125, 3.2486572265625, 3.41015625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 4.0, 9.0, 11.0, 17.0, 30.0, 62.0, 86.0, 116.0, 172.0, 373.0, 714.0, 1670.0, 5326.0, 26656.0, 482826.0, 3521891.0, 133920.0, 14339.0, 3441.0, 1325.0, 585.0, 289.0, 163.0, 85.0, 52.0, 40.0, 23.0, 17.0, 9.0, 12.0, 8.0, 1.0, 1.0], "bins": [-33.09375, -32.37939453125, -31.6650390625, -30.95068359375, -30.236328125, -29.52197265625, -28.8076171875, -28.09326171875, -27.37890625, -26.66455078125, -25.9501953125, -25.23583984375, -24.521484375, -23.80712890625, -23.0927734375, -22.37841796875, -21.6640625, -20.94970703125, -20.2353515625, -19.52099609375, -18.806640625, -18.09228515625, -17.3779296875, -16.66357421875, -15.94921875, -15.23486328125, -14.5205078125, -13.80615234375, -13.091796875, -12.37744140625, -11.6630859375, -10.94873046875, -10.234375, -9.52001953125, -8.8056640625, -8.09130859375, -7.376953125, -6.66259765625, -5.9482421875, -5.23388671875, -4.51953125, -3.80517578125, -3.0908203125, -2.37646484375, -1.662109375, -0.94775390625, -0.2333984375, 0.48095703125, 1.1953125, 1.90966796875, 2.6240234375, 3.33837890625, 4.052734375, 4.76708984375, 5.4814453125, 6.19580078125, 6.91015625, 7.62451171875, 8.3388671875, 9.05322265625, 9.767578125, 10.48193359375, 11.1962890625, 11.91064453125, 12.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 8.0, 14.0, 34.0, 44.0, 74.0, 135.0, 237.0, 330.0, 585.0, 820.0, 699.0, 430.0, 254.0, 149.0, 100.0, 56.0, 34.0, 28.0, 16.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.219482421875, -14.54833984375, -13.877197265625, -13.2060546875, -12.534912109375, -11.86376953125, -11.192626953125, -10.521484375, -9.850341796875, -9.17919921875, -8.508056640625, -7.8369140625, -7.165771484375, -6.49462890625, -5.823486328125, -5.15234375, -4.481201171875, -3.81005859375, -3.138916015625, -2.4677734375, -1.796630859375, -1.12548828125, -0.454345703125, 0.216796875, 0.887939453125, 1.55908203125, 2.230224609375, 2.9013671875, 3.572509765625, 4.24365234375, 4.914794921875, 5.5859375, 6.257080078125, 6.92822265625, 7.599365234375, 8.2705078125, 8.941650390625, 9.61279296875, 10.283935546875, 10.955078125, 11.626220703125, 12.29736328125, 12.968505859375, 13.6396484375, 14.310791015625, 14.98193359375, 15.653076171875, 16.32421875, 16.995361328125, 17.66650390625, 18.337646484375, 19.0087890625, 19.679931640625, 20.35107421875, 21.022216796875, 21.693359375, 22.364501953125, 23.03564453125, 23.706787109375, 24.3779296875, 25.049072265625, 25.72021484375, 26.391357421875, 27.0625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 18.0, 26.0, 29.0, 66.0, 112.0, 262.0, 565.0, 1339.0, 4538.0, 526046.0, 3648990.0, 9143.0, 1741.0, 686.0, 325.0, 153.0, 91.0, 62.0, 29.0, 12.0, 8.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-72.5625, -70.1552734375, -67.748046875, -65.3408203125, -62.93359375, -60.5263671875, -58.119140625, -55.7119140625, -53.3046875, -50.8974609375, -48.490234375, -46.0830078125, -43.67578125, -41.2685546875, -38.861328125, -36.4541015625, -34.046875, -31.6396484375, -29.232421875, -26.8251953125, -24.41796875, -22.0107421875, -19.603515625, -17.1962890625, -14.7890625, -12.3818359375, -9.974609375, -7.5673828125, -5.16015625, -2.7529296875, -0.345703125, 2.0615234375, 4.46875, 6.8759765625, 9.283203125, 11.6904296875, 14.09765625, 16.5048828125, 18.912109375, 21.3193359375, 23.7265625, 26.1337890625, 28.541015625, 30.9482421875, 33.35546875, 35.7626953125, 38.169921875, 40.5771484375, 42.984375, 45.3916015625, 47.798828125, 50.2060546875, 52.61328125, 55.0205078125, 57.427734375, 59.8349609375, 62.2421875, 64.6494140625, 67.056640625, 69.4638671875, 71.87109375, 74.2783203125, 76.685546875, 79.0927734375, 81.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 16.0, 44.0, 193.0, 425.0, 243.0, 73.0, 14.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.2716064453125, -208.23072814941406, -204.18984985351562, -200.1489715576172, -196.10809326171875, -192.0672149658203, -188.02633666992188, -183.9854736328125, -179.944580078125, -175.90370178222656, -171.86282348632812, -167.8219451904297, -163.78106689453125, -159.7401885986328, -155.69931030273438, -151.658447265625, -147.61756896972656, -143.57669067382812, -139.5358123779297, -135.49493408203125, -131.4540557861328, -127.41317749023438, -123.37230682373047, -119.33142852783203, -115.2905502319336, -111.24967193603516, -107.20879364013672, -103.16791534423828, -99.12704467773438, -95.08616638183594, -91.0452880859375, -87.00440979003906, -82.96353149414062, -78.92265319824219, -74.88177490234375, -70.84089660644531, -66.80001831054688, -62.7591438293457, -58.71826934814453, -54.677391052246094, -50.63651657104492, -46.595638275146484, -42.55476379394531, -38.513885498046875, -34.47300720214844, -30.43212890625, -26.391252517700195, -22.35037612915039, -18.309497833251953, -14.268620491027832, -10.227743148803711, -6.18686580657959, -2.1459884643554688, 1.8948898315429688, 5.935766220092773, 9.976642608642578, 14.017520904541016, 18.058399200439453, 22.099275588989258, 26.140151977539062, 30.1810302734375, 34.22190856933594, 38.262786865234375, 42.30366134643555, 46.344539642333984]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 5.0, 9.0, 5.0, 12.0, 5.0, 20.0, 14.0, 16.0, 19.0, 22.0, 21.0, 16.0, 37.0, 31.0, 42.0, 26.0, 30.0, 44.0, 38.0, 37.0, 30.0, 30.0, 37.0, 39.0, 41.0, 33.0, 51.0, 31.0, 34.0, 28.0, 28.0, 21.0, 19.0, 14.0, 27.0, 12.0, 11.0, 7.0, 13.0, 6.0, 7.0, 6.0, 10.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0], "bins": [-44.282958984375, -43.00820541381836, -41.73345184326172, -40.45869827270508, -39.18394470214844, -37.9091911315918, -36.634437561035156, -35.35968780517578, -34.084930419921875, -32.810176849365234, -31.535423278808594, -30.260669708251953, -28.985916137695312, -27.711162567138672, -26.436410903930664, -25.161657333374023, -23.886905670166016, -22.612152099609375, -21.337398529052734, -20.062644958496094, -18.787891387939453, -17.513137817382812, -16.238386154174805, -14.963632583618164, -13.688879013061523, -12.414125442504883, -11.139371871948242, -9.864619255065918, -8.589865684509277, -7.315112113952637, -6.040359020233154, -4.765605926513672, -3.4908523559570312, -2.2160990238189697, -0.9413456916809082, 0.3334076404571533, 1.6081609725952148, 2.8829145431518555, 4.157667636871338, 5.43242073059082, 6.707174301147461, 7.981927871704102, 9.256681442260742, 10.531434059143066, 11.806187629699707, 13.080941200256348, 14.355693817138672, 15.630447387695312, 16.905200958251953, 18.179954528808594, 19.454708099365234, 20.729461669921875, 22.004215240478516, 23.278968811035156, 24.553720474243164, 25.828474044799805, 27.103227615356445, 28.377981185913086, 29.652734756469727, 30.927488327026367, 32.202239990234375, 33.476993560791016, 34.751747131347656, 36.0265007019043, 37.30125427246094]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 29.0, 46.0, 60.0, 85.0, 110.0, 191.0, 242.0, 364.0, 519.0, 720.0, 1137.0, 1540.0, 2265.0, 3384.0, 4838.0, 7391.0, 10979.0, 16461.0, 24432.0, 37086.0, 56146.0, 87430.0, 130522.0, 171932.0, 158227.0, 113185.0, 74671.0, 48235.0, 31832.0, 21042.0, 14026.0, 9492.0, 6240.0, 4304.0, 2913.0, 1946.0, 1404.0, 934.0, 659.0, 475.0, 321.0, 234.0, 148.0, 101.0, 84.0, 58.0, 31.0, 25.0, 13.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.3349571228027344, -0.32372283935546875, -0.3124885559082031, -0.3012542724609375, -0.2900199890136719, -0.27878570556640625, -0.2675514221191406, -0.256317138671875, -0.24508285522460938, -0.23384857177734375, -0.22261428833007812, -0.2113800048828125, -0.20014572143554688, -0.18891143798828125, -0.17767715454101562, -0.16644287109375, -0.15520858764648438, -0.14397430419921875, -0.13274002075195312, -0.1215057373046875, -0.11027145385742188, -0.09903717041015625, -0.08780288696289062, -0.076568603515625, -0.06533432006835938, -0.05410003662109375, -0.042865753173828125, -0.0316314697265625, -0.020397186279296875, -0.00916290283203125, 0.002071380615234375, 0.0133056640625, 0.024539947509765625, 0.03577423095703125, 0.047008514404296875, 0.0582427978515625, 0.06947708129882812, 0.08071136474609375, 0.09194564819335938, 0.103179931640625, 0.11441421508789062, 0.12564849853515625, 0.13688278198242188, 0.1481170654296875, 0.15935134887695312, 0.17058563232421875, 0.18181991577148438, 0.19305419921875, 0.20428848266601562, 0.21552276611328125, 0.22675704956054688, 0.2379913330078125, 0.24922561645507812, 0.26045989990234375, 0.2716941833496094, 0.282928466796875, 0.2941627502441406, 0.30539703369140625, 0.3166313171386719, 0.3278656005859375, 0.3390998840332031, 0.35033416748046875, 0.3615684509277344, 0.372802734375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 8.0, 14.0, 18.0, 16.0, 14.0, 19.0, 30.0, 31.0, 27.0, 32.0, 29.0, 46.0, 42.0, 40.0, 38.0, 47.0, 1066.0, 33.0, 33.0, 48.0, 41.0, 35.0, 32.0, 21.0, 34.0, 32.0, 25.0, 14.0, 29.0, 18.0, 14.0, 10.0, 16.0, 8.0, 8.0, 9.0, 8.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.214141845703125, -2.14117431640625, -2.068206787109375, -1.9952392578125, -1.922271728515625, -1.84930419921875, -1.776336669921875, -1.703369140625, -1.630401611328125, -1.55743408203125, -1.484466552734375, -1.4114990234375, -1.338531494140625, -1.26556396484375, -1.192596435546875, -1.11962890625, -1.046661376953125, -0.97369384765625, -0.900726318359375, -0.8277587890625, -0.754791259765625, -0.68182373046875, -0.608856201171875, -0.535888671875, -0.462921142578125, -0.38995361328125, -0.316986083984375, -0.2440185546875, -0.171051025390625, -0.09808349609375, -0.025115966796875, 0.0478515625, 0.120819091796875, 0.19378662109375, 0.266754150390625, 0.3397216796875, 0.412689208984375, 0.48565673828125, 0.558624267578125, 0.631591796875, 0.704559326171875, 0.77752685546875, 0.850494384765625, 0.9234619140625, 0.996429443359375, 1.06939697265625, 1.142364501953125, 1.21533203125, 1.288299560546875, 1.36126708984375, 1.434234619140625, 1.5072021484375, 1.580169677734375, 1.65313720703125, 1.726104736328125, 1.799072265625, 1.872039794921875, 1.94500732421875, 2.017974853515625, 2.0909423828125, 2.163909912109375, 2.23687744140625, 2.309844970703125, 2.3828125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 4.0, 11.0, 14.0, 23.0, 36.0, 58.0, 92.0, 102.0, 189.0, 303.0, 514.0, 755.0, 1359.0, 2123.0, 3583.0, 5903.0, 9968.0, 16434.0, 26980.0, 44670.0, 72015.0, 111197.0, 154575.0, 1220992.0, 148644.0, 103884.0, 67155.0, 41641.0, 25327.0, 15238.0, 9227.0, 5613.0, 3340.0, 2023.0, 1206.0, 734.0, 445.0, 258.0, 176.0, 96.0, 74.0, 52.0, 28.0, 20.0, 15.0, 14.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2753715515136719, -0.26631927490234375, -0.2572669982910156, -0.2482147216796875, -0.23916244506835938, -0.23011016845703125, -0.22105789184570312, -0.212005615234375, -0.20295333862304688, -0.19390106201171875, -0.18484878540039062, -0.1757965087890625, -0.16674423217773438, -0.15769195556640625, -0.14863967895507812, -0.13958740234375, -0.13053512573242188, -0.12148284912109375, -0.11243057250976562, -0.1033782958984375, -0.09432601928710938, -0.08527374267578125, -0.07622146606445312, -0.067169189453125, -0.058116912841796875, -0.04906463623046875, -0.040012359619140625, -0.0309600830078125, -0.021907806396484375, -0.01285552978515625, -0.003803253173828125, 0.0052490234375, 0.014301300048828125, 0.02335357666015625, 0.032405853271484375, 0.0414581298828125, 0.050510406494140625, 0.05956268310546875, 0.06861495971679688, 0.077667236328125, 0.08671951293945312, 0.09577178955078125, 0.10482406616210938, 0.1138763427734375, 0.12292861938476562, 0.13198089599609375, 0.14103317260742188, 0.15008544921875, 0.15913772583007812, 0.16819000244140625, 0.17724227905273438, 0.1862945556640625, 0.19534683227539062, 0.20439910888671875, 0.21345138549804688, 0.222503662109375, 0.23155593872070312, 0.24060821533203125, 0.24966049194335938, 0.2587127685546875, 0.2677650451660156, 0.27681732177734375, 0.2858695983886719, 0.294921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 11.0, 4.0, 20.0, 16.0, 12.0, 30.0, 38.0, 44.0, 42.0, 59.0, 65.0, 57.0, 56.0, 71.0, 75.0, 47.0, 58.0, 42.0, 54.0, 35.0, 30.0, 21.0, 12.0, 17.0, 14.0, 8.0, 10.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020160675048828125, -0.0019510090351104736, -0.0018859505653381348, -0.001820892095565796, -0.001755833625793457, -0.0016907751560211182, -0.0016257166862487793, -0.0015606582164764404, -0.0014955997467041016, -0.0014305412769317627, -0.0013654828071594238, -0.001300424337387085, -0.001235365867614746, -0.0011703073978424072, -0.0011052489280700684, -0.0010401904582977295, -0.0009751319885253906, -0.0009100735187530518, -0.0008450150489807129, -0.000779956579208374, -0.0007148981094360352, -0.0006498396396636963, -0.0005847811698913574, -0.0005197227001190186, -0.0004546642303466797, -0.0003896057605743408, -0.00032454729080200195, -0.0002594888210296631, -0.00019443035125732422, -0.00012937188148498535, -6.431341171264648e-05, 7.450580596923828e-07, 6.580352783203125e-05, 0.00013086199760437012, 0.00019592046737670898, 0.00026097893714904785, 0.0003260374069213867, 0.0003910958766937256, 0.00045615434646606445, 0.0005212128162384033, 0.0005862712860107422, 0.0006513297557830811, 0.0007163882255554199, 0.0007814466953277588, 0.0008465051651000977, 0.0009115636348724365, 0.0009766221046447754, 0.0010416805744171143, 0.0011067390441894531, 0.001171797513961792, 0.0012368559837341309, 0.0013019144535064697, 0.0013669729232788086, 0.0014320313930511475, 0.0014970898628234863, 0.0015621483325958252, 0.001627206802368164, 0.001692265272140503, 0.0017573237419128418, 0.0018223822116851807, 0.0018874406814575195, 0.0019524991512298584, 0.0020175576210021973, 0.002082616090774536, 0.002147674560546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 13.0, 13.0, 22.0, 29.0, 39.0, 45.0, 49.0, 74.0, 103.0, 141.0, 137.0, 191.0, 344.0, 716.0, 5486.0, 1028896.0, 9972.0, 807.0, 412.0, 256.0, 158.0, 129.0, 107.0, 78.0, 45.0, 49.0, 28.0, 30.0, 20.0, 27.0, 28.0, 12.0, 6.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0401611328125, -0.038999080657958984, -0.03783702850341797, -0.03667497634887695, -0.03551292419433594, -0.03435087203979492, -0.033188819885253906, -0.03202676773071289, -0.030864715576171875, -0.02970266342163086, -0.028540611267089844, -0.027378559112548828, -0.026216506958007812, -0.025054454803466797, -0.02389240264892578, -0.022730350494384766, -0.02156829833984375, -0.020406246185302734, -0.01924419403076172, -0.018082141876220703, -0.016920089721679688, -0.015758037567138672, -0.014595985412597656, -0.01343393325805664, -0.012271881103515625, -0.01110982894897461, -0.009947776794433594, -0.008785724639892578, -0.0076236724853515625, -0.006461620330810547, -0.005299568176269531, -0.004137516021728516, -0.0029754638671875, -0.0018134117126464844, -0.0006513595581054688, 0.0005106925964355469, 0.0016727447509765625, 0.002834796905517578, 0.003996849060058594, 0.005158901214599609, 0.006320953369140625, 0.007483005523681641, 0.008645057678222656, 0.009807109832763672, 0.010969161987304688, 0.012131214141845703, 0.013293266296386719, 0.014455318450927734, 0.01561737060546875, 0.016779422760009766, 0.01794147491455078, 0.019103527069091797, 0.020265579223632812, 0.021427631378173828, 0.022589683532714844, 0.02375173568725586, 0.024913787841796875, 0.02607583999633789, 0.027237892150878906, 0.028399944305419922, 0.029561996459960938, 0.030724048614501953, 0.03188610076904297, 0.033048152923583984, 0.034210205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 979.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028607146814465523, -0.027993997558951378, -0.027380848303437233, -0.026767700910568237, -0.026154551655054092, -0.025541402399539948, -0.024928253144025803, -0.024315103888511658, -0.023701954632997513, -0.023088805377483368, -0.022475656121969223, -0.021862506866455078, -0.021249359473586082, -0.020636210218071938, -0.020023060962557793, -0.019409911707043648, -0.018796764314174652, -0.018183615058660507, -0.017570465803146362, -0.016957316547632217, -0.016344169154763222, -0.015731019899249077, -0.015117870643734932, -0.014504721388220787, -0.013891572132706642, -0.013278422877192497, -0.012665274553000927, -0.012052125297486782, -0.011438976041972637, -0.010825827717781067, -0.010212678462266922, -0.009599529206752777, -0.008986380882561207, -0.008373231627047062, -0.007760082837194204, -0.007146934047341347, -0.006533784791827202, -0.005920636001974344, -0.005307487212121487, -0.004694337956607342, -0.004081189166754484, -0.003468040144070983, -0.0028548911213874817, -0.002241742331534624, -0.0016285933088511229, -0.0010154442861676216, -0.000402295496314764, 0.00021085375919938087, 0.0008240025490522385, 0.0014371515717357397, 0.002050300594419241, 0.0026634493842720985, 0.0032765984069556, 0.003889747429639101, 0.004502896219491959, 0.0051160454750061035, 0.005729194264858961, 0.006342343054711819, 0.006955492310225964, 0.007568641100078821, 0.008181789889931679, 0.008794939145445824, 0.009408088400959969, 0.010021237656474113, 0.010634385980665684]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 11.0, 10.0, 20.0, 25.0, 26.0, 53.0, 35.0, 36.0, 55.0, 59.0, 55.0, 68.0, 55.0, 69.0, 66.0, 62.0, 52.0, 51.0, 43.0, 37.0, 16.0, 22.0, 12.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011274218559265137, -0.0010774759575724602, -0.0010275300592184067, -0.0009775841608643532, -0.0009276382625102997, -0.0008776923641562462, -0.0008277464658021927, -0.0007778005674481392, -0.0007278546690940857, -0.0006779087707400322, -0.0006279628723859787, -0.0005780169740319252, -0.0005280710756778717, -0.0004781251773238182, -0.0004281792789697647, -0.0003782333806157112, -0.0003282874822616577, -0.0002783415839076042, -0.00022839568555355072, -0.00017844978719949722, -0.00012850388884544373, -7.855799049139023e-05, -2.861209213733673e-05, 2.1333806216716766e-05, 7.127970457077026e-05, 0.00012122560292482376, 0.00017117150127887726, 0.00022111739963293076, 0.00027106329798698425, 0.00032100919634103775, 0.00037095509469509125, 0.00042090099304914474, 0.00047084689140319824, 0.0005207927897572517, 0.0005707386881113052, 0.0006206845864653587, 0.0006706304848194122, 0.0007205763831734657, 0.0007705222815275192, 0.0008204681798815727, 0.0008704140782356262, 0.0009203599765896797, 0.0009703058749437332, 0.0010202517732977867, 0.0010701976716518402, 0.0011201435700058937, 0.0011700894683599472, 0.0012200353667140007, 0.0012699812650680542, 0.0013199271634221077, 0.0013698730617761612, 0.0014198189601302147, 0.0014697648584842682, 0.0015197107568383217, 0.0015696566551923752, 0.0016196025535464287, 0.0016695484519004822, 0.0017194943502545357, 0.0017694402486085892, 0.0018193861469626427, 0.0018693320453166962, 0.0019192779436707497, 0.001969223842024803, 0.0020191697403788567, 0.00206911563873291]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 4.0, 16.0, 20.0, 17.0, 28.0, 26.0, 46.0, 33.0, 54.0, 58.0, 44.0, 50.0, 50.0, 70.0, 60.0, 62.0, 52.0, 41.0, 55.0, 30.0, 42.0, 39.0, 31.0, 16.0, 18.0, 13.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.216796875, -6.05078125, -5.884765625, -5.71875, -5.552734375, -5.38671875, -5.220703125, -5.0546875, -4.888671875, -4.72265625, -4.556640625, -4.390625, -4.224609375, -4.05859375, -3.892578125, -3.7265625, -3.560546875, -3.39453125, -3.228515625, -3.0625, -2.896484375, -2.73046875, -2.564453125, -2.3984375, -2.232421875, -2.06640625, -1.900390625, -1.734375, -1.568359375, -1.40234375, -1.236328125, -1.0703125, -0.904296875, -0.73828125, -0.572265625, -0.40625, -0.240234375, -0.07421875, 0.091796875, 0.2578125, 0.423828125, 0.58984375, 0.755859375, 0.921875, 1.087890625, 1.25390625, 1.419921875, 1.5859375, 1.751953125, 1.91796875, 2.083984375, 2.25, 2.416015625, 2.58203125, 2.748046875, 2.9140625, 3.080078125, 3.24609375, 3.412109375, 3.578125, 3.744140625, 3.91015625, 4.076171875, 4.2421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 13.0, 5.0, 13.0, 26.0, 29.0, 33.0, 64.0, 62.0, 131.0, 181.0, 224.0, 401.0, 512.0, 884.0, 1401.0, 2391.0, 3829.0, 6746.0, 13246.0, 34029.0, 348266.0, 559734.0, 42755.0, 15040.0, 7447.0, 4349.0, 2382.0, 1483.0, 962.0, 613.0, 397.0, 273.0, 188.0, 137.0, 84.0, 57.0, 46.0, 27.0, 29.0, 14.0, 16.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.65625, -18.07470703125, -17.4931640625, -16.91162109375, -16.330078125, -15.74853515625, -15.1669921875, -14.58544921875, -14.00390625, -13.42236328125, -12.8408203125, -12.25927734375, -11.677734375, -11.09619140625, -10.5146484375, -9.93310546875, -9.3515625, -8.77001953125, -8.1884765625, -7.60693359375, -7.025390625, -6.44384765625, -5.8623046875, -5.28076171875, -4.69921875, -4.11767578125, -3.5361328125, -2.95458984375, -2.373046875, -1.79150390625, -1.2099609375, -0.62841796875, -0.046875, 0.53466796875, 1.1162109375, 1.69775390625, 2.279296875, 2.86083984375, 3.4423828125, 4.02392578125, 4.60546875, 5.18701171875, 5.7685546875, 6.35009765625, 6.931640625, 7.51318359375, 8.0947265625, 8.67626953125, 9.2578125, 9.83935546875, 10.4208984375, 11.00244140625, 11.583984375, 12.16552734375, 12.7470703125, 13.32861328125, 13.91015625, 14.49169921875, 15.0732421875, 15.65478515625, 16.236328125, 16.81787109375, 17.3994140625, 17.98095703125, 18.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 11.0, 16.0, 24.0, 14.0, 30.0, 32.0, 29.0, 40.0, 37.0, 46.0, 60.0, 56.0, 113.0, 412.0, 1511.0, 162.0, 57.0, 53.0, 49.0, 47.0, 29.0, 47.0, 25.0, 18.0, 19.0, 19.0, 17.0, 9.0, 10.0, 6.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.765625, -15.3408203125, -14.916015625, -14.4912109375, -14.06640625, -13.6416015625, -13.216796875, -12.7919921875, -12.3671875, -11.9423828125, -11.517578125, -11.0927734375, -10.66796875, -10.2431640625, -9.818359375, -9.3935546875, -8.96875, -8.5439453125, -8.119140625, -7.6943359375, -7.26953125, -6.8447265625, -6.419921875, -5.9951171875, -5.5703125, -5.1455078125, -4.720703125, -4.2958984375, -3.87109375, -3.4462890625, -3.021484375, -2.5966796875, -2.171875, -1.7470703125, -1.322265625, -0.8974609375, -0.47265625, -0.0478515625, 0.376953125, 0.8017578125, 1.2265625, 1.6513671875, 2.076171875, 2.5009765625, 2.92578125, 3.3505859375, 3.775390625, 4.2001953125, 4.625, 5.0498046875, 5.474609375, 5.8994140625, 6.32421875, 6.7490234375, 7.173828125, 7.5986328125, 8.0234375, 8.4482421875, 8.873046875, 9.2978515625, 9.72265625, 10.1474609375, 10.572265625, 10.9970703125, 11.421875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 10.0, 11.0, 7.0, 21.0, 13.0, 31.0, 18.0, 39.0, 31.0, 62.0, 62.0, 130.0, 273.0, 1353.0, 2075228.0, 1066373.0, 1222.0, 291.0, 141.0, 86.0, 59.0, 36.0, 35.0, 25.0, 21.0, 22.0, 14.0, 17.0, 19.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.69580078125, -45.8603515625, -44.02490234375, -42.189453125, -40.35400390625, -38.5185546875, -36.68310546875, -34.84765625, -33.01220703125, -31.1767578125, -29.34130859375, -27.505859375, -25.67041015625, -23.8349609375, -21.99951171875, -20.1640625, -18.32861328125, -16.4931640625, -14.65771484375, -12.822265625, -10.98681640625, -9.1513671875, -7.31591796875, -5.48046875, -3.64501953125, -1.8095703125, 0.02587890625, 1.861328125, 3.69677734375, 5.5322265625, 7.36767578125, 9.203125, 11.03857421875, 12.8740234375, 14.70947265625, 16.544921875, 18.38037109375, 20.2158203125, 22.05126953125, 23.88671875, 25.72216796875, 27.5576171875, 29.39306640625, 31.228515625, 33.06396484375, 34.8994140625, 36.73486328125, 38.5703125, 40.40576171875, 42.2412109375, 44.07666015625, 45.912109375, 47.74755859375, 49.5830078125, 51.41845703125, 53.25390625, 55.08935546875, 56.9248046875, 58.76025390625, 60.595703125, 62.43115234375, 64.2666015625, 66.10205078125, 67.9375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 94.0, 612.0, 286.0, 18.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.560911178588867, -9.121329307556152, -6.6817474365234375, -4.242165565490723, -1.8025836944580078, 0.636998176574707, 3.076580047607422, 5.51616096496582, 7.955743789672852, 10.395325660705566, 12.834907531738281, 15.274489402770996, 17.71407127380371, 20.15365219116211, 22.59323501586914, 25.03281593322754, 27.47239875793457, 29.91197967529297, 32.3515625, 34.79114532470703, 37.23072814941406, 39.67030715942383, 42.10988998413086, 44.549468994140625, 46.989051818847656, 49.42863464355469, 51.86821746826172, 54.307796478271484, 56.747379302978516, 59.18696212768555, 61.62654113769531, 64.06612396240234, 66.50570678710938, 68.9452896118164, 71.38487243652344, 73.82445526123047, 76.2640380859375, 78.70361328125, 81.14319610595703, 83.58277893066406, 86.0223617553711, 88.46194458007812, 90.90152740478516, 93.34111022949219, 95.78068542480469, 98.22026824951172, 100.65985107421875, 103.09943389892578, 105.53901672363281, 107.97859954833984, 110.41818237304688, 112.8577651977539, 115.29734802246094, 117.73692321777344, 120.17650604248047, 122.6160888671875, 125.05567169189453, 127.49525451660156, 129.93482971191406, 132.37442016601562, 134.81399536132812, 137.2535858154297, 139.6931610107422, 142.13275146484375, 144.57232666015625]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 2.0, 2.0, 9.0, 10.0, 9.0, 16.0, 12.0, 14.0, 19.0, 18.0, 24.0, 26.0, 29.0, 21.0, 35.0, 32.0, 33.0, 36.0, 41.0, 35.0, 40.0, 44.0, 53.0, 38.0, 41.0, 34.0, 32.0, 38.0, 47.0, 37.0, 26.0, 22.0, 18.0, 22.0, 15.0, 11.0, 12.0, 12.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0], "bins": [-46.899314880371094, -45.650611877441406, -44.40190505981445, -43.153202056884766, -41.90449905395508, -40.655792236328125, -39.40708923339844, -38.15838623046875, -36.9096794128418, -35.66097640991211, -34.412269592285156, -33.16356658935547, -31.91486167907715, -30.666156768798828, -29.41745376586914, -28.16874885559082, -26.920045852661133, -25.671340942382812, -24.422637939453125, -23.173933029174805, -21.925228118896484, -20.676525115966797, -19.427820205688477, -18.179115295410156, -16.93041229248047, -15.681708335876465, -14.433003425598145, -13.18429946899414, -11.93559455871582, -10.686890602111816, -9.438186645507812, -8.189481735229492, -6.940776824951172, -5.69207239151001, -4.443367958068848, -3.1946640014648438, -1.9459595680236816, -0.6972551345825195, 0.5514488220214844, 1.8001537322998047, 3.0488576889038086, 4.297562122344971, 5.546266555786133, 6.794970512390137, 8.04367446899414, 9.292379379272461, 10.541083335876465, 11.789788246154785, 13.038492202758789, 14.287196159362793, 15.535901069641113, 16.784605026245117, 18.033309936523438, 19.282012939453125, 20.530717849731445, 21.779422760009766, 23.028125762939453, 24.276830673217773, 25.52553367614746, 26.77423858642578, 28.0229434967041, 29.271648406982422, 30.52035140991211, 31.76905632019043, 33.01776123046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 40.0, 35.0, 36.0, 51.0, 49.0, 49.0, 35.0, 61.0, 72.0, 49.0, 55.0, 53.0, 37.0, 45.0, 52.0, 28.0, 35.0, 32.0, 34.0, 22.0, 16.0, 7.0, 3.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.390625, -6.2210693359375, -6.051513671875, -5.8819580078125, -5.71240234375, -5.5428466796875, -5.373291015625, -5.2037353515625, -5.0341796875, -4.8646240234375, -4.695068359375, -4.5255126953125, -4.35595703125, -4.1864013671875, -4.016845703125, -3.8472900390625, -3.677734375, -3.5081787109375, -3.338623046875, -3.1690673828125, -2.99951171875, -2.8299560546875, -2.660400390625, -2.4908447265625, -2.3212890625, -2.1517333984375, -1.982177734375, -1.8126220703125, -1.64306640625, -1.4735107421875, -1.303955078125, -1.1343994140625, -0.96484375, -0.7952880859375, -0.625732421875, -0.4561767578125, -0.28662109375, -0.1170654296875, 0.052490234375, 0.2220458984375, 0.3916015625, 0.5611572265625, 0.730712890625, 0.9002685546875, 1.06982421875, 1.2393798828125, 1.408935546875, 1.5784912109375, 1.748046875, 1.9176025390625, 2.087158203125, 2.2567138671875, 2.42626953125, 2.5958251953125, 2.765380859375, 2.9349365234375, 3.1044921875, 3.2740478515625, 3.443603515625, 3.6131591796875, 3.78271484375, 3.9522705078125, 4.121826171875, 4.2913818359375, 4.4609375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 9.0, 9.0, 14.0, 20.0, 40.0, 78.0, 90.0, 179.0, 303.0, 581.0, 1442.0, 4561.0, 24196.0, 390990.0, 3632661.0, 120839.0, 13014.0, 3091.0, 1052.0, 488.0, 227.0, 145.0, 89.0, 70.0, 35.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-40.375, -39.46435546875, -38.5537109375, -37.64306640625, -36.732421875, -35.82177734375, -34.9111328125, -34.00048828125, -33.08984375, -32.17919921875, -31.2685546875, -30.35791015625, -29.447265625, -28.53662109375, -27.6259765625, -26.71533203125, -25.8046875, -24.89404296875, -23.9833984375, -23.07275390625, -22.162109375, -21.25146484375, -20.3408203125, -19.43017578125, -18.51953125, -17.60888671875, -16.6982421875, -15.78759765625, -14.876953125, -13.96630859375, -13.0556640625, -12.14501953125, -11.234375, -10.32373046875, -9.4130859375, -8.50244140625, -7.591796875, -6.68115234375, -5.7705078125, -4.85986328125, -3.94921875, -3.03857421875, -2.1279296875, -1.21728515625, -0.306640625, 0.60400390625, 1.5146484375, 2.42529296875, 3.3359375, 4.24658203125, 5.1572265625, 6.06787109375, 6.978515625, 7.88916015625, 8.7998046875, 9.71044921875, 10.62109375, 11.53173828125, 12.4423828125, 13.35302734375, 14.263671875, 15.17431640625, 16.0849609375, 16.99560546875, 17.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 1.0, 10.0, 9.0, 30.0, 37.0, 71.0, 116.0, 154.0, 259.0, 422.0, 640.0, 763.0, 603.0, 369.0, 234.0, 130.0, 73.0, 61.0, 41.0, 23.0, 9.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.6533203125, -17.947265625, -17.2412109375, -16.53515625, -15.8291015625, -15.123046875, -14.4169921875, -13.7109375, -13.0048828125, -12.298828125, -11.5927734375, -10.88671875, -10.1806640625, -9.474609375, -8.7685546875, -8.0625, -7.3564453125, -6.650390625, -5.9443359375, -5.23828125, -4.5322265625, -3.826171875, -3.1201171875, -2.4140625, -1.7080078125, -1.001953125, -0.2958984375, 0.41015625, 1.1162109375, 1.822265625, 2.5283203125, 3.234375, 3.9404296875, 4.646484375, 5.3525390625, 6.05859375, 6.7646484375, 7.470703125, 8.1767578125, 8.8828125, 9.5888671875, 10.294921875, 11.0009765625, 11.70703125, 12.4130859375, 13.119140625, 13.8251953125, 14.53125, 15.2373046875, 15.943359375, 16.6494140625, 17.35546875, 18.0615234375, 18.767578125, 19.4736328125, 20.1796875, 20.8857421875, 21.591796875, 22.2978515625, 23.00390625, 23.7099609375, 24.416015625, 25.1220703125, 25.828125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 12.0, 7.0, 8.0, 25.0, 18.0, 45.0, 56.0, 105.0, 176.0, 377.0, 1285.0, 16107.0, 3893395.0, 277834.0, 3443.0, 669.0, 327.0, 142.0, 76.0, 61.0, 17.0, 30.0, 18.0, 13.0, 12.0, 6.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -44.40869140625, -42.1611328125, -39.91357421875, -37.666015625, -35.41845703125, -33.1708984375, -30.92333984375, -28.67578125, -26.42822265625, -24.1806640625, -21.93310546875, -19.685546875, -17.43798828125, -15.1904296875, -12.94287109375, -10.6953125, -8.44775390625, -6.2001953125, -3.95263671875, -1.705078125, 0.54248046875, 2.7900390625, 5.03759765625, 7.28515625, 9.53271484375, 11.7802734375, 14.02783203125, 16.275390625, 18.52294921875, 20.7705078125, 23.01806640625, 25.265625, 27.51318359375, 29.7607421875, 32.00830078125, 34.255859375, 36.50341796875, 38.7509765625, 40.99853515625, 43.24609375, 45.49365234375, 47.7412109375, 49.98876953125, 52.236328125, 54.48388671875, 56.7314453125, 58.97900390625, 61.2265625, 63.47412109375, 65.7216796875, 67.96923828125, 70.216796875, 72.46435546875, 74.7119140625, 76.95947265625, 79.20703125, 81.45458984375, 83.7021484375, 85.94970703125, 88.197265625, 90.44482421875, 92.6923828125, 94.93994140625, 97.1875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 36.0, 151.0, 460.0, 280.0, 77.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.6538848876953, -163.9443359375, -158.23477172851562, -152.5252227783203, -146.815673828125, -141.10610961914062, -135.3965606689453, -129.68701171875, -123.97745513916016, -118.26789855957031, -112.558349609375, -106.84879302978516, -101.13923645019531, -95.4296875, -89.72013092041016, -84.01057434082031, -78.301025390625, -72.59146881103516, -66.88191986083984, -61.17236328125, -55.46281051635742, -49.753257751464844, -44.043701171875, -38.33414840698242, -32.624595642089844, -26.915042877197266, -21.205488204956055, -15.495933532714844, -9.786380767822266, -4.0768280029296875, 1.6327285766601562, 7.342281341552734, 13.051849365234375, 18.761402130126953, 24.470956802368164, 30.180511474609375, 35.89006423950195, 41.59961700439453, 47.309173583984375, 53.01872634887695, 58.72827911376953, 64.43783569335938, 70.14738464355469, 75.85694122314453, 81.56649780273438, 87.27604675292969, 92.98560333251953, 98.69515991210938, 104.40470886230469, 110.11426544189453, 115.82381439208984, 121.53337097167969, 127.242919921875, 132.95248413085938, 138.6620330810547, 144.37158203125, 150.08114624023438, 155.7906951904297, 161.50025939941406, 167.20980834960938, 172.9193572998047, 178.62890625, 184.33847045898438, 190.0480194091797, 195.757568359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 8.0, 20.0, 14.0, 24.0, 19.0, 18.0, 19.0, 35.0, 44.0, 42.0, 42.0, 53.0, 51.0, 48.0, 38.0, 44.0, 48.0, 47.0, 32.0, 43.0, 23.0, 41.0, 29.0, 32.0, 24.0, 38.0, 21.0, 16.0, 13.0, 15.0, 2.0, 9.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.267303466796875, -51.675743103027344, -50.08417892456055, -48.492618560791016, -46.90105438232422, -45.30949401855469, -43.717933654785156, -42.126373291015625, -40.53480911254883, -38.9432487487793, -37.3516845703125, -35.76012420654297, -34.16856384277344, -32.57699966430664, -30.98543930053711, -29.393877029418945, -27.80231475830078, -26.210752487182617, -24.619190216064453, -23.027629852294922, -21.436067581176758, -19.844505310058594, -18.252944946289062, -16.6613826751709, -15.069820404052734, -13.47825813293457, -11.886696815490723, -10.295135498046875, -8.703573226928711, -7.112011432647705, -5.520449638366699, -3.9288883209228516, -2.3373260498046875, -0.7457642555236816, 0.8457975387573242, 2.43735933303833, 4.028921127319336, 5.620482921600342, 7.212044715881348, 8.803606033325195, 10.39516830444336, 11.986730575561523, 13.578291893005371, 15.169853210449219, 16.761415481567383, 18.352977752685547, 19.944538116455078, 21.536100387573242, 23.127662658691406, 24.71922492980957, 26.310787200927734, 27.902347564697266, 29.49390983581543, 31.085472106933594, 32.677032470703125, 34.268592834472656, 35.86015701293945, 37.451717376708984, 39.04328155517578, 40.63484191894531, 42.226402282714844, 43.81796646118164, 45.40952682495117, 47.00109100341797, 48.5926513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 23.0, 25.0, 37.0, 63.0, 99.0, 149.0, 189.0, 300.0, 470.0, 723.0, 1155.0, 1642.0, 2769.0, 4415.0, 6930.0, 11315.0, 18100.0, 29291.0, 48200.0, 79185.0, 126807.0, 179916.0, 186340.0, 133353.0, 84004.0, 50657.0, 31157.0, 19255.0, 11853.0, 7508.0, 4510.0, 2835.0, 1842.0, 1213.0, 736.0, 518.0, 313.0, 173.0, 175.0, 102.0, 70.0, 32.0, 27.0, 21.0, 16.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3854179382324219, -0.37215423583984375, -0.3588905334472656, -0.3456268310546875, -0.3323631286621094, -0.31909942626953125, -0.3058357238769531, -0.292572021484375, -0.2793083190917969, -0.26604461669921875, -0.2527809143066406, -0.2395172119140625, -0.22625350952148438, -0.21298980712890625, -0.19972610473632812, -0.18646240234375, -0.17319869995117188, -0.15993499755859375, -0.14667129516601562, -0.1334075927734375, -0.12014389038085938, -0.10688018798828125, -0.09361648559570312, -0.080352783203125, -0.06708908081054688, -0.05382537841796875, -0.040561676025390625, -0.0272979736328125, -0.014034271240234375, -0.00077056884765625, 0.012493133544921875, 0.0257568359375, 0.039020538330078125, 0.05228424072265625, 0.06554794311523438, 0.0788116455078125, 0.09207534790039062, 0.10533905029296875, 0.11860275268554688, 0.131866455078125, 0.14513015747070312, 0.15839385986328125, 0.17165756225585938, 0.1849212646484375, 0.19818496704101562, 0.21144866943359375, 0.22471237182617188, 0.23797607421875, 0.2512397766113281, 0.26450347900390625, 0.2777671813964844, 0.2910308837890625, 0.3042945861816406, 0.31755828857421875, 0.3308219909667969, 0.344085693359375, 0.3573493957519531, 0.37061309814453125, 0.3838768005371094, 0.3971405029296875, 0.4104042053222656, 0.42366790771484375, 0.4369316101074219, 0.4501953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 2.0, 7.0, 12.0, 11.0, 12.0, 21.0, 13.0, 16.0, 20.0, 28.0, 48.0, 36.0, 35.0, 49.0, 57.0, 51.0, 41.0, 1070.0, 53.0, 56.0, 53.0, 45.0, 32.0, 30.0, 38.0, 30.0, 27.0, 28.0, 23.0, 24.0, 7.0, 10.0, 9.0, 9.0, 17.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.328125, -3.231353759765625, -3.13458251953125, -3.037811279296875, -2.9410400390625, -2.844268798828125, -2.74749755859375, -2.650726318359375, -2.553955078125, -2.457183837890625, -2.36041259765625, -2.263641357421875, -2.1668701171875, -2.070098876953125, -1.97332763671875, -1.876556396484375, -1.77978515625, -1.683013916015625, -1.58624267578125, -1.489471435546875, -1.3927001953125, -1.295928955078125, -1.19915771484375, -1.102386474609375, -1.005615234375, -0.908843994140625, -0.81207275390625, -0.715301513671875, -0.6185302734375, -0.521759033203125, -0.42498779296875, -0.328216552734375, -0.2314453125, -0.134674072265625, -0.03790283203125, 0.058868408203125, 0.1556396484375, 0.252410888671875, 0.34918212890625, 0.445953369140625, 0.542724609375, 0.639495849609375, 0.73626708984375, 0.833038330078125, 0.9298095703125, 1.026580810546875, 1.12335205078125, 1.220123291015625, 1.31689453125, 1.413665771484375, 1.51043701171875, 1.607208251953125, 1.7039794921875, 1.800750732421875, 1.89752197265625, 1.994293212890625, 2.091064453125, 2.187835693359375, 2.28460693359375, 2.381378173828125, 2.4781494140625, 2.574920654296875, 2.67169189453125, 2.768463134765625, 2.865234375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 6.0, 16.0, 26.0, 31.0, 55.0, 90.0, 164.0, 262.0, 417.0, 658.0, 1018.0, 1716.0, 2793.0, 4563.0, 7677.0, 12990.0, 21925.0, 37430.0, 63105.0, 101756.0, 151310.0, 1231360.0, 164621.0, 115425.0, 71977.0, 43097.0, 25598.0, 14868.0, 8677.0, 5322.0, 3220.0, 1934.0, 1150.0, 706.0, 417.0, 262.0, 194.0, 93.0, 49.0, 50.0, 29.0, 21.0, 15.0, 13.0, 9.0, 3.0, 3.0, 5.0, 0.0, 4.0], "bins": [-0.363037109375, -0.35285186767578125, -0.3426666259765625, -0.33248138427734375, -0.322296142578125, -0.31211090087890625, -0.3019256591796875, -0.29174041748046875, -0.28155517578125, -0.27136993408203125, -0.2611846923828125, -0.25099945068359375, -0.240814208984375, -0.23062896728515625, -0.2204437255859375, -0.21025848388671875, -0.2000732421875, -0.18988800048828125, -0.1797027587890625, -0.16951751708984375, -0.159332275390625, -0.14914703369140625, -0.1389617919921875, -0.12877655029296875, -0.11859130859375, -0.10840606689453125, -0.0982208251953125, -0.08803558349609375, -0.077850341796875, -0.06766510009765625, -0.0574798583984375, -0.04729461669921875, -0.037109375, -0.02692413330078125, -0.0167388916015625, -0.00655364990234375, 0.003631591796875, 0.01381683349609375, 0.0240020751953125, 0.03418731689453125, 0.04437255859375, 0.05455780029296875, 0.0647430419921875, 0.07492828369140625, 0.085113525390625, 0.09529876708984375, 0.1054840087890625, 0.11566925048828125, 0.1258544921875, 0.13603973388671875, 0.1462249755859375, 0.15641021728515625, 0.166595458984375, 0.17678070068359375, 0.1869659423828125, 0.19715118408203125, 0.20733642578125, 0.21752166748046875, 0.2277069091796875, 0.23789215087890625, 0.248077392578125, 0.25826263427734375, 0.2684478759765625, 0.27863311767578125, 0.288818359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 3.0, 7.0, 4.0, 12.0, 17.0, 18.0, 19.0, 25.0, 29.0, 34.0, 44.0, 39.0, 56.0, 48.0, 58.0, 75.0, 64.0, 67.0, 52.0, 47.0, 44.0, 38.0, 29.0, 33.0, 25.0, 24.0, 28.0, 16.0, 13.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023345947265625, -0.0022717267274856567, -0.0022088587284088135, -0.00214599072933197, -0.002083122730255127, -0.0020202547311782837, -0.0019573867321014404, -0.0018945187330245972, -0.001831650733947754, -0.0017687827348709106, -0.0017059147357940674, -0.0016430467367172241, -0.0015801787376403809, -0.0015173107385635376, -0.0014544427394866943, -0.001391574740409851, -0.0013287067413330078, -0.0012658387422561646, -0.0012029707431793213, -0.001140102744102478, -0.0010772347450256348, -0.0010143667459487915, -0.0009514987468719482, -0.000888630747795105, -0.0008257627487182617, -0.0007628947496414185, -0.0007000267505645752, -0.0006371587514877319, -0.0005742907524108887, -0.0005114227533340454, -0.00044855475425720215, -0.0003856867551803589, -0.0003228187561035156, -0.00025995075702667236, -0.0001970827579498291, -0.00013421475887298584, -7.134675979614258e-05, -8.478760719299316e-06, 5.4389238357543945e-05, 0.00011725723743438721, 0.00018012523651123047, 0.00024299323558807373, 0.000305861234664917, 0.00036872923374176025, 0.0004315972328186035, 0.0004944652318954468, 0.00055733323097229, 0.0006202012300491333, 0.0006830692291259766, 0.0007459372282028198, 0.0008088052272796631, 0.0008716732263565063, 0.0009345412254333496, 0.0009974092245101929, 0.0010602772235870361, 0.0011231452226638794, 0.0011860132217407227, 0.001248881220817566, 0.0013117492198944092, 0.0013746172189712524, 0.0014374852180480957, 0.001500353217124939, 0.0015632212162017822, 0.0016260892152786255, 0.0016889572143554688]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 6.0, 6.0, 12.0, 17.0, 27.0, 34.0, 41.0, 47.0, 70.0, 72.0, 95.0, 130.0, 187.0, 300.0, 598.0, 3586.0, 1026557.0, 14843.0, 751.0, 329.0, 230.0, 129.0, 109.0, 102.0, 82.0, 47.0, 38.0, 24.0, 25.0, 16.0, 7.0, 10.0, 12.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042236328125, -0.04085731506347656, -0.039478302001953125, -0.03809928894042969, -0.03672027587890625, -0.03534126281738281, -0.033962249755859375, -0.03258323669433594, -0.0312042236328125, -0.029825210571289062, -0.028446197509765625, -0.027067184448242188, -0.02568817138671875, -0.024309158325195312, -0.022930145263671875, -0.021551132202148438, -0.020172119140625, -0.018793106079101562, -0.017414093017578125, -0.016035079956054688, -0.01465606689453125, -0.013277053833007812, -0.011898040771484375, -0.010519027709960938, -0.0091400146484375, -0.0077610015869140625, -0.006381988525390625, -0.0050029754638671875, -0.00362396240234375, -0.0022449493408203125, -0.000865936279296875, 0.0005130767822265625, 0.00189208984375, 0.0032711029052734375, 0.004650115966796875, 0.0060291290283203125, 0.00740814208984375, 0.008787155151367188, 0.010166168212890625, 0.011545181274414062, 0.0129241943359375, 0.014303207397460938, 0.015682220458984375, 0.017061233520507812, 0.01844024658203125, 0.019819259643554688, 0.021198272705078125, 0.022577285766601562, 0.023956298828125, 0.025335311889648438, 0.026714324951171875, 0.028093338012695312, 0.02947235107421875, 0.030851364135742188, 0.032230377197265625, 0.03360939025878906, 0.0349884033203125, 0.03636741638183594, 0.037746429443359375, 0.03912544250488281, 0.04050445556640625, 0.04188346862792969, 0.043262481689453125, 0.04464149475097656, 0.0460205078125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 524.0, 492.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02187264710664749, -0.02111779898405075, -0.02036294899880886, -0.01960810087621212, -0.01885325089097023, -0.01809840276837349, -0.01734355464577675, -0.01658870466053486, -0.01583385467529297, -0.015079005621373653, -0.014324156567454338, -0.013569308444857597, -0.012814458459615707, -0.012059610337018967, -0.011304761283099651, -0.010549912229180336, -0.009795064106583595, -0.00904021505266428, -0.008285365998744965, -0.007530517410486937, -0.006775668356567621, -0.006020819302648306, -0.005265970714390278, -0.0045111216604709625, -0.003756272606551647, -0.003001423552632332, -0.00224657473154366, -0.0014917259104549885, -0.0007368768565356731, 1.7972197383642197e-05, 0.0007728207856416702, 0.0015276698395609856, 0.00228252075612545, 0.0030373698100447655, 0.003792218631133437, 0.004547067452222109, 0.005301916506141424, 0.0060567655600607395, 0.0068116141483187675, 0.007566463202238083, 0.008321312256157398, 0.009076161310076714, 0.009831010363996029, 0.010585859417915344, 0.011340707540512085, 0.012095557525753975, 0.012850405648350716, 0.013605254702270031, 0.014360103756189346, 0.015114952810108662, 0.015869801864027977, 0.016624649986624718, 0.017379499971866608, 0.01813434809446335, 0.01888919621706009, 0.01964404620230198, 0.02039889618754387, 0.02115374431014061, 0.0219085942953825, 0.02266344241797924, 0.02341829240322113, 0.02417314052581787, 0.024927988648414612, 0.025682838633656502, 0.026437686756253242]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 13.0, 9.0, 13.0, 16.0, 22.0, 33.0, 19.0, 32.0, 35.0, 48.0, 59.0, 52.0, 38.0, 50.0, 47.0, 50.0, 68.0, 54.0, 51.0, 31.0, 33.0, 30.0, 37.0, 29.0, 22.0, 18.0, 15.0, 11.0, 15.0, 8.0, 11.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000983893871307373, -0.0009442325681447983, -0.0009045712649822235, -0.0008649099618196487, -0.000825248658657074, -0.0007855873554944992, -0.0007459260523319244, -0.0007062647491693497, -0.0006666034460067749, -0.0006269421428442001, -0.0005872808396816254, -0.0005476195365190506, -0.0005079582333564758, -0.00046829693019390106, -0.0004286356270313263, -0.0003889743238687515, -0.00034931302070617676, -0.000309651717543602, -0.0002699904143810272, -0.00023032911121845245, -0.00019066780805587769, -0.00015100650489330292, -0.00011134520173072815, -7.168389856815338e-05, -3.202259540557861e-05, 7.638707756996155e-06, 4.730001091957092e-05, 8.696131408214569e-05, 0.00012662261724472046, 0.00016628392040729523, 0.00020594522356987, 0.00024560652673244476, 0.00028526782989501953, 0.0003249291330575943, 0.00036459043622016907, 0.00040425173938274384, 0.0004439130425453186, 0.00048357434570789337, 0.0005232356488704681, 0.0005628969520330429, 0.0006025582551956177, 0.0006422195583581924, 0.0006818808615207672, 0.000721542164683342, 0.0007612034678459167, 0.0008008647710084915, 0.0008405260741710663, 0.000880187377333641, 0.0009198486804962158, 0.0009595099836587906, 0.0009991712868213654, 0.0010388325899839401, 0.001078493893146515, 0.0011181551963090897, 0.0011578164994716644, 0.0011974778026342392, 0.001237139105796814, 0.0012768004089593887, 0.0013164617121219635, 0.0013561230152845383, 0.001395784318447113, 0.0014354456216096878, 0.0014751069247722626, 0.0015147682279348373, 0.0015544295310974121]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 7.0, 6.0, 14.0, 8.0, 14.0, 20.0, 22.0, 41.0, 27.0, 35.0, 49.0, 51.0, 37.0, 41.0, 57.0, 55.0, 53.0, 55.0, 50.0, 49.0, 40.0, 48.0, 35.0, 34.0, 28.0, 25.0, 23.0, 24.0, 25.0, 12.0, 3.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20849609375, -5.0458984375, -4.88330078125, -4.720703125, -4.55810546875, -4.3955078125, -4.23291015625, -4.0703125, -3.90771484375, -3.7451171875, -3.58251953125, -3.419921875, -3.25732421875, -3.0947265625, -2.93212890625, -2.76953125, -2.60693359375, -2.4443359375, -2.28173828125, -2.119140625, -1.95654296875, -1.7939453125, -1.63134765625, -1.46875, -1.30615234375, -1.1435546875, -0.98095703125, -0.818359375, -0.65576171875, -0.4931640625, -0.33056640625, -0.16796875, -0.00537109375, 0.1572265625, 0.31982421875, 0.482421875, 0.64501953125, 0.8076171875, 0.97021484375, 1.1328125, 1.29541015625, 1.4580078125, 1.62060546875, 1.783203125, 1.94580078125, 2.1083984375, 2.27099609375, 2.43359375, 2.59619140625, 2.7587890625, 2.92138671875, 3.083984375, 3.24658203125, 3.4091796875, 3.57177734375, 3.734375, 3.89697265625, 4.0595703125, 4.22216796875, 4.384765625, 4.54736328125, 4.7099609375, 4.87255859375, 5.03515625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 7.0, 9.0, 25.0, 26.0, 38.0, 69.0, 112.0, 131.0, 231.0, 328.0, 602.0, 1074.0, 2405.0, 6356.0, 23466.0, 104769.0, 502465.0, 320371.0, 62366.0, 14984.0, 4629.0, 1797.0, 882.0, 460.0, 344.0, 225.0, 131.0, 74.0, 57.0, 34.0, 32.0, 13.0, 12.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2109375, -5.05224609375, -4.8935546875, -4.73486328125, -4.576171875, -4.41748046875, -4.2587890625, -4.10009765625, -3.94140625, -3.78271484375, -3.6240234375, -3.46533203125, -3.306640625, -3.14794921875, -2.9892578125, -2.83056640625, -2.671875, -2.51318359375, -2.3544921875, -2.19580078125, -2.037109375, -1.87841796875, -1.7197265625, -1.56103515625, -1.40234375, -1.24365234375, -1.0849609375, -0.92626953125, -0.767578125, -0.60888671875, -0.4501953125, -0.29150390625, -0.1328125, 0.02587890625, 0.1845703125, 0.34326171875, 0.501953125, 0.66064453125, 0.8193359375, 0.97802734375, 1.13671875, 1.29541015625, 1.4541015625, 1.61279296875, 1.771484375, 1.93017578125, 2.0888671875, 2.24755859375, 2.40625, 2.56494140625, 2.7236328125, 2.88232421875, 3.041015625, 3.19970703125, 3.3583984375, 3.51708984375, 3.67578125, 3.83447265625, 3.9931640625, 4.15185546875, 4.310546875, 4.46923828125, 4.6279296875, 4.78662109375, 4.9453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 16.0, 16.0, 13.0, 9.0, 18.0, 21.0, 25.0, 26.0, 34.0, 39.0, 28.0, 37.0, 42.0, 52.0, 60.0, 147.0, 1772.0, 196.0, 75.0, 50.0, 36.0, 28.0, 31.0, 30.0, 35.0, 30.0, 32.0, 18.0, 12.0, 20.0, 16.0, 8.0, 13.0, 6.0, 8.0, 5.0, 7.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0], "bins": [-16.265625, -15.8212890625, -15.376953125, -14.9326171875, -14.48828125, -14.0439453125, -13.599609375, -13.1552734375, -12.7109375, -12.2666015625, -11.822265625, -11.3779296875, -10.93359375, -10.4892578125, -10.044921875, -9.6005859375, -9.15625, -8.7119140625, -8.267578125, -7.8232421875, -7.37890625, -6.9345703125, -6.490234375, -6.0458984375, -5.6015625, -5.1572265625, -4.712890625, -4.2685546875, -3.82421875, -3.3798828125, -2.935546875, -2.4912109375, -2.046875, -1.6025390625, -1.158203125, -0.7138671875, -0.26953125, 0.1748046875, 0.619140625, 1.0634765625, 1.5078125, 1.9521484375, 2.396484375, 2.8408203125, 3.28515625, 3.7294921875, 4.173828125, 4.6181640625, 5.0625, 5.5068359375, 5.951171875, 6.3955078125, 6.83984375, 7.2841796875, 7.728515625, 8.1728515625, 8.6171875, 9.0615234375, 9.505859375, 9.9501953125, 10.39453125, 10.8388671875, 11.283203125, 11.7275390625, 12.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 3.0, 5.0, 10.0, 14.0, 11.0, 10.0, 19.0, 9.0, 21.0, 28.0, 34.0, 30.0, 48.0, 45.0, 71.0, 110.0, 205.0, 430.0, 1472.0, 29980.0, 3098407.0, 12455.0, 1182.0, 415.0, 178.0, 103.0, 69.0, 51.0, 53.0, 34.0, 24.0, 32.0, 19.0, 17.0, 14.0, 16.0, 8.0, 12.0, 15.0, 8.0, 1.0, 3.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.296875, -24.374267578125, -23.45166015625, -22.529052734375, -21.6064453125, -20.683837890625, -19.76123046875, -18.838623046875, -17.916015625, -16.993408203125, -16.07080078125, -15.148193359375, -14.2255859375, -13.302978515625, -12.38037109375, -11.457763671875, -10.53515625, -9.612548828125, -8.68994140625, -7.767333984375, -6.8447265625, -5.922119140625, -4.99951171875, -4.076904296875, -3.154296875, -2.231689453125, -1.30908203125, -0.386474609375, 0.5361328125, 1.458740234375, 2.38134765625, 3.303955078125, 4.2265625, 5.149169921875, 6.07177734375, 6.994384765625, 7.9169921875, 8.839599609375, 9.76220703125, 10.684814453125, 11.607421875, 12.530029296875, 13.45263671875, 14.375244140625, 15.2978515625, 16.220458984375, 17.14306640625, 18.065673828125, 18.98828125, 19.910888671875, 20.83349609375, 21.756103515625, 22.6787109375, 23.601318359375, 24.52392578125, 25.446533203125, 26.369140625, 27.291748046875, 28.21435546875, 29.136962890625, 30.0595703125, 30.982177734375, 31.90478515625, 32.827392578125, 33.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [19.0, 408.0, 574.0, 16.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.012465476989746, -2.6173341274261475, -0.22220277786254883, 2.172928810119629, 4.568059921264648, 6.963191032409668, 9.358323097229004, 11.753453254699707, 14.148585319519043, 16.543716430664062, 18.9388484954834, 21.333980560302734, 23.729110717773438, 26.12424087524414, 28.51937484741211, 30.914505004882812, 33.309635162353516, 35.70476531982422, 38.09989929199219, 40.49502944946289, 42.890159606933594, 45.28529357910156, 47.680423736572266, 50.07555389404297, 52.47068786621094, 54.86581802368164, 57.26095199584961, 59.65608215332031, 62.051212310791016, 64.44634246826172, 66.84147644042969, 69.23660278320312, 71.6317367553711, 74.02687072753906, 76.4219970703125, 78.81713104248047, 81.21226501464844, 83.60739135742188, 86.00252532958984, 88.39765930175781, 90.79278564453125, 93.18791961669922, 95.58304595947266, 97.97817993164062, 100.3733139038086, 102.76844024658203, 105.16357421875, 107.55870056152344, 109.95384216308594, 112.3489761352539, 114.74410247802734, 117.13923645019531, 119.53437042236328, 121.92949676513672, 124.32463073730469, 126.71975708007812, 129.11488342285156, 131.510009765625, 133.9051513671875, 136.30027770996094, 138.69540405273438, 141.09054565429688, 143.4856719970703, 145.88079833984375, 148.27593994140625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 14.0, 9.0, 7.0, 12.0, 17.0, 21.0, 21.0, 28.0, 29.0, 28.0, 27.0, 26.0, 46.0, 42.0, 62.0, 48.0, 38.0, 47.0, 49.0, 52.0, 51.0, 43.0, 35.0, 35.0, 39.0, 31.0, 27.0, 15.0, 16.0, 16.0, 9.0, 14.0, 13.0, 12.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.16040802001953, -45.56102752685547, -43.961647033691406, -42.362266540527344, -40.76288604736328, -39.16350555419922, -37.564125061035156, -35.964744567871094, -34.36536407470703, -32.76598358154297, -31.166603088378906, -29.567222595214844, -27.96784210205078, -26.36846160888672, -24.769079208374023, -23.16969871520996, -21.570316314697266, -19.970935821533203, -18.37155532836914, -16.772174835205078, -15.1727933883667, -13.573412895202637, -11.974031448364258, -10.374650955200195, -8.775270462036133, -7.17588996887207, -5.57650899887085, -3.977128028869629, -2.3777475357055664, -0.7783670425415039, 0.821014404296875, 2.4203948974609375, 4.019775390625, 5.6191558837890625, 7.218536853790283, 8.817917823791504, 10.417298316955566, 12.016678810119629, 13.616060256958008, 15.21544075012207, 16.814821243286133, 18.414201736450195, 20.013582229614258, 21.612964630126953, 23.212345123291016, 24.811725616455078, 26.41110610961914, 28.010486602783203, 29.609867095947266, 31.209247589111328, 32.80862808227539, 34.40800857543945, 36.007389068603516, 37.60676956176758, 39.206153869628906, 40.80553436279297, 42.40491485595703, 44.004295349121094, 45.603675842285156, 47.20305633544922, 48.80243682861328, 50.401817321777344, 52.001197814941406, 53.60057830810547, 55.19995880126953]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 8.0, 16.0, 9.0, 14.0, 24.0, 25.0, 34.0, 31.0, 47.0, 42.0, 49.0, 34.0, 46.0, 54.0, 59.0, 41.0, 66.0, 61.0, 36.0, 40.0, 46.0, 34.0, 32.0, 32.0, 18.0, 22.0, 27.0, 19.0, 12.0, 5.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2890625, -5.122802734375, -4.95654296875, -4.790283203125, -4.6240234375, -4.457763671875, -4.29150390625, -4.125244140625, -3.958984375, -3.792724609375, -3.62646484375, -3.460205078125, -3.2939453125, -3.127685546875, -2.96142578125, -2.795166015625, -2.62890625, -2.462646484375, -2.29638671875, -2.130126953125, -1.9638671875, -1.797607421875, -1.63134765625, -1.465087890625, -1.298828125, -1.132568359375, -0.96630859375, -0.800048828125, -0.6337890625, -0.467529296875, -0.30126953125, -0.135009765625, 0.03125, 0.197509765625, 0.36376953125, 0.530029296875, 0.6962890625, 0.862548828125, 1.02880859375, 1.195068359375, 1.361328125, 1.527587890625, 1.69384765625, 1.860107421875, 2.0263671875, 2.192626953125, 2.35888671875, 2.525146484375, 2.69140625, 2.857666015625, 3.02392578125, 3.190185546875, 3.3564453125, 3.522705078125, 3.68896484375, 3.855224609375, 4.021484375, 4.187744140625, 4.35400390625, 4.520263671875, 4.6865234375, 4.852783203125, 5.01904296875, 5.185302734375, 5.3515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 2.0, 3.0, 10.0, 5.0, 13.0, 12.0, 19.0, 25.0, 39.0, 49.0, 52.0, 94.0, 138.0, 298.0, 832.0, 3017.0, 19772.0, 366154.0, 3563850.0, 221603.0, 14459.0, 2437.0, 708.0, 260.0, 143.0, 67.0, 54.0, 48.0, 32.0, 20.0, 21.0, 20.0, 6.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.801025390625, -21.14892578125, -20.496826171875, -19.8447265625, -19.192626953125, -18.54052734375, -17.888427734375, -17.236328125, -16.584228515625, -15.93212890625, -15.280029296875, -14.6279296875, -13.975830078125, -13.32373046875, -12.671630859375, -12.01953125, -11.367431640625, -10.71533203125, -10.063232421875, -9.4111328125, -8.759033203125, -8.10693359375, -7.454833984375, -6.802734375, -6.150634765625, -5.49853515625, -4.846435546875, -4.1943359375, -3.542236328125, -2.89013671875, -2.238037109375, -1.5859375, -0.933837890625, -0.28173828125, 0.370361328125, 1.0224609375, 1.674560546875, 2.32666015625, 2.978759765625, 3.630859375, 4.282958984375, 4.93505859375, 5.587158203125, 6.2392578125, 6.891357421875, 7.54345703125, 8.195556640625, 8.84765625, 9.499755859375, 10.15185546875, 10.803955078125, 11.4560546875, 12.108154296875, 12.76025390625, 13.412353515625, 14.064453125, 14.716552734375, 15.36865234375, 16.020751953125, 16.6728515625, 17.324951171875, 17.97705078125, 18.629150390625, 19.28125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 10.0, 8.0, 11.0, 25.0, 29.0, 51.0, 99.0, 138.0, 198.0, 332.0, 473.0, 606.0, 659.0, 485.0, 361.0, 221.0, 118.0, 98.0, 56.0, 36.0, 26.0, 16.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.44677734375, -16.8466796875, -16.24658203125, -15.646484375, -15.04638671875, -14.4462890625, -13.84619140625, -13.24609375, -12.64599609375, -12.0458984375, -11.44580078125, -10.845703125, -10.24560546875, -9.6455078125, -9.04541015625, -8.4453125, -7.84521484375, -7.2451171875, -6.64501953125, -6.044921875, -5.44482421875, -4.8447265625, -4.24462890625, -3.64453125, -3.04443359375, -2.4443359375, -1.84423828125, -1.244140625, -0.64404296875, -0.0439453125, 0.55615234375, 1.15625, 1.75634765625, 2.3564453125, 2.95654296875, 3.556640625, 4.15673828125, 4.7568359375, 5.35693359375, 5.95703125, 6.55712890625, 7.1572265625, 7.75732421875, 8.357421875, 8.95751953125, 9.5576171875, 10.15771484375, 10.7578125, 11.35791015625, 11.9580078125, 12.55810546875, 13.158203125, 13.75830078125, 14.3583984375, 14.95849609375, 15.55859375, 16.15869140625, 16.7587890625, 17.35888671875, 17.958984375, 18.55908203125, 19.1591796875, 19.75927734375, 20.359375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 23.0, 22.0, 41.0, 83.0, 120.0, 231.0, 383.0, 985.0, 4300.0, 70229.0, 3707947.0, 396397.0, 10611.0, 1601.0, 596.0, 304.0, 135.0, 84.0, 63.0, 32.0, 34.0, 14.0, 7.0, 8.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.44580078125, -31.0166015625, -29.58740234375, -28.158203125, -26.72900390625, -25.2998046875, -23.87060546875, -22.44140625, -21.01220703125, -19.5830078125, -18.15380859375, -16.724609375, -15.29541015625, -13.8662109375, -12.43701171875, -11.0078125, -9.57861328125, -8.1494140625, -6.72021484375, -5.291015625, -3.86181640625, -2.4326171875, -1.00341796875, 0.42578125, 1.85498046875, 3.2841796875, 4.71337890625, 6.142578125, 7.57177734375, 9.0009765625, 10.43017578125, 11.859375, 13.28857421875, 14.7177734375, 16.14697265625, 17.576171875, 19.00537109375, 20.4345703125, 21.86376953125, 23.29296875, 24.72216796875, 26.1513671875, 27.58056640625, 29.009765625, 30.43896484375, 31.8681640625, 33.29736328125, 34.7265625, 36.15576171875, 37.5849609375, 39.01416015625, 40.443359375, 41.87255859375, 43.3017578125, 44.73095703125, 46.16015625, 47.58935546875, 49.0185546875, 50.44775390625, 51.876953125, 53.30615234375, 54.7353515625, 56.16455078125, 57.59375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 31.0, 232.0, 461.0, 243.0, 42.0, 6.0, 0.0, 1.0], "bins": [-401.98382568359375, -395.11151123046875, -388.2391662597656, -381.3668518066406, -374.4945068359375, -367.6221923828125, -360.7498779296875, -353.8775329589844, -347.0052185058594, -340.1329040527344, -333.26055908203125, -326.38824462890625, -319.5158996582031, -312.6435852050781, -305.771240234375, -298.89892578125, -292.026611328125, -285.154296875, -278.2819519042969, -271.4096374511719, -264.53729248046875, -257.66497802734375, -250.7926483154297, -243.92031860351562, -237.0479736328125, -230.17564392089844, -223.30331420898438, -216.43099975585938, -209.5586700439453, -202.68634033203125, -195.8140106201172, -188.94168090820312, -182.06936645507812, -175.19703674316406, -168.32470703125, -161.452392578125, -154.58006286621094, -147.70773315429688, -140.8354034423828, -133.96307373046875, -127.09074401855469, -120.21841430664062, -113.3460922241211, -106.47376251220703, -99.6014404296875, -92.72911071777344, -85.85678100585938, -78.98445129394531, -72.11212921142578, -65.23979949951172, -58.36747741699219, -51.495147705078125, -44.62282180786133, -37.75049591064453, -30.87816619873047, -24.005840301513672, -17.133514404296875, -10.261187553405762, -3.3888607025146484, 3.4834671020507812, 10.355792999267578, 17.228118896484375, 24.100448608398438, 30.972774505615234, 37.84510040283203]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 6.0, 4.0, 8.0, 10.0, 9.0, 15.0, 4.0, 10.0, 12.0, 9.0, 18.0, 13.0, 26.0, 26.0, 17.0, 26.0, 25.0, 42.0, 28.0, 33.0, 34.0, 16.0, 44.0, 32.0, 25.0, 34.0, 44.0, 33.0, 42.0, 22.0, 36.0, 32.0, 18.0, 25.0, 25.0, 21.0, 22.0, 21.0, 22.0, 12.0, 13.0, 12.0, 6.0, 8.0, 10.0, 13.0, 11.0, 5.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-35.4333381652832, -34.29182434082031, -33.150306701660156, -32.008792877197266, -30.867279052734375, -29.72576332092285, -28.584247589111328, -27.442733764648438, -26.301218032836914, -25.15970230102539, -24.0181884765625, -22.876672744750977, -21.735157012939453, -20.593643188476562, -19.45212745666504, -18.310611724853516, -17.169097900390625, -16.0275821685791, -14.886068344116211, -13.744552612304688, -12.60303783416748, -11.461523056030273, -10.32000732421875, -9.178492546081543, -8.036977767944336, -6.895462989807129, -5.753947734832764, -4.612432479858398, -3.4709177017211914, -2.3294029235839844, -1.1878876686096191, -0.046372413635253906, 1.0951461791992188, 2.236661195755005, 3.378176212310791, 4.519691467285156, 5.661206245422363, 6.80272102355957, 7.9442362785339355, 9.0857515335083, 10.227266311645508, 11.368781089782715, 12.510295867919922, 13.651811599731445, 14.793326377868652, 15.93484115600586, 17.076356887817383, 18.217872619628906, 19.359386444091797, 20.50090217590332, 21.64241600036621, 22.783931732177734, 23.925445556640625, 25.06696128845215, 26.208477020263672, 27.349990844726562, 28.491506576538086, 29.63302230834961, 30.7745361328125, 31.916051864624023, 33.05756759643555, 34.19908142089844, 35.34059524536133, 36.482112884521484, 37.623626708984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 8.0, 14.0, 21.0, 29.0, 49.0, 66.0, 86.0, 160.0, 175.0, 274.0, 420.0, 599.0, 855.0, 1381.0, 1958.0, 2964.0, 4537.0, 6884.0, 10491.0, 16619.0, 26619.0, 42629.0, 70017.0, 114301.0, 170342.0, 193117.0, 143829.0, 90858.0, 55500.0, 34051.0, 20778.0, 13464.0, 8534.0, 5580.0, 3717.0, 2494.0, 1644.0, 1079.0, 687.0, 526.0, 397.0, 209.0, 170.0, 130.0, 97.0, 74.0, 29.0, 18.0, 15.0, 30.0, 12.0, 13.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.453369140625, -0.4397392272949219, -0.42610931396484375, -0.4124794006347656, -0.3988494873046875, -0.3852195739746094, -0.37158966064453125, -0.3579597473144531, -0.344329833984375, -0.3306999206542969, -0.31707000732421875, -0.3034400939941406, -0.2898101806640625, -0.2761802673339844, -0.26255035400390625, -0.24892044067382812, -0.23529052734375, -0.22166061401367188, -0.20803070068359375, -0.19440078735351562, -0.1807708740234375, -0.16714096069335938, -0.15351104736328125, -0.13988113403320312, -0.126251220703125, -0.11262130737304688, -0.09899139404296875, -0.08536148071289062, -0.0717315673828125, -0.058101654052734375, -0.04447174072265625, -0.030841827392578125, -0.0172119140625, -0.003582000732421875, 0.01004791259765625, 0.023677825927734375, 0.0373077392578125, 0.050937652587890625, 0.06456756591796875, 0.07819747924804688, 0.091827392578125, 0.10545730590820312, 0.11908721923828125, 0.13271713256835938, 0.1463470458984375, 0.15997695922851562, 0.17360687255859375, 0.18723678588867188, 0.20086669921875, 0.21449661254882812, 0.22812652587890625, 0.24175643920898438, 0.2553863525390625, 0.2690162658691406, 0.28264617919921875, 0.2962760925292969, 0.309906005859375, 0.3235359191894531, 0.33716583251953125, 0.3507957458496094, 0.3644256591796875, 0.3780555725097656, 0.39168548583984375, 0.4053153991699219, 0.4189453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 14.0, 12.0, 16.0, 11.0, 11.0, 24.0, 23.0, 16.0, 25.0, 32.0, 32.0, 25.0, 25.0, 38.0, 40.0, 52.0, 35.0, 1069.0, 34.0, 37.0, 33.0, 34.0, 34.0, 42.0, 34.0, 27.0, 43.0, 30.0, 21.0, 23.0, 10.0, 12.0, 8.0, 11.0, 18.0, 4.0, 4.0, 10.0, 8.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0], "bins": [-2.74609375, -2.667266845703125, -2.58843994140625, -2.509613037109375, -2.4307861328125, -2.351959228515625, -2.27313232421875, -2.194305419921875, -2.115478515625, -2.036651611328125, -1.95782470703125, -1.878997802734375, -1.8001708984375, -1.721343994140625, -1.64251708984375, -1.563690185546875, -1.48486328125, -1.406036376953125, -1.32720947265625, -1.248382568359375, -1.1695556640625, -1.090728759765625, -1.01190185546875, -0.933074951171875, -0.854248046875, -0.775421142578125, -0.69659423828125, -0.617767333984375, -0.5389404296875, -0.460113525390625, -0.38128662109375, -0.302459716796875, -0.2236328125, -0.144805908203125, -0.06597900390625, 0.012847900390625, 0.0916748046875, 0.170501708984375, 0.24932861328125, 0.328155517578125, 0.406982421875, 0.485809326171875, 0.56463623046875, 0.643463134765625, 0.7222900390625, 0.801116943359375, 0.87994384765625, 0.958770751953125, 1.03759765625, 1.116424560546875, 1.19525146484375, 1.274078369140625, 1.3529052734375, 1.431732177734375, 1.51055908203125, 1.589385986328125, 1.668212890625, 1.747039794921875, 1.82586669921875, 1.904693603515625, 1.9835205078125, 2.062347412109375, 2.14117431640625, 2.220001220703125, 2.298828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 5.0, 18.0, 30.0, 25.0, 50.0, 90.0, 137.0, 195.0, 330.0, 588.0, 820.0, 1293.0, 2125.0, 3356.0, 4986.0, 8003.0, 12510.0, 19494.0, 30383.0, 46139.0, 70379.0, 102728.0, 138598.0, 1205070.0, 140136.0, 104518.0, 72107.0, 46951.0, 30606.0, 19909.0, 12559.0, 8246.0, 5247.0, 3467.0, 2195.0, 1386.0, 918.0, 541.0, 365.0, 211.0, 146.0, 103.0, 45.0, 35.0, 34.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.332275390625, -0.3226509094238281, -0.31302642822265625, -0.3034019470214844, -0.2937774658203125, -0.2841529846191406, -0.27452850341796875, -0.2649040222167969, -0.255279541015625, -0.24565505981445312, -0.23603057861328125, -0.22640609741210938, -0.2167816162109375, -0.20715713500976562, -0.19753265380859375, -0.18790817260742188, -0.17828369140625, -0.16865921020507812, -0.15903472900390625, -0.14941024780273438, -0.1397857666015625, -0.13016128540039062, -0.12053680419921875, -0.11091232299804688, -0.101287841796875, -0.09166336059570312, -0.08203887939453125, -0.07241439819335938, -0.0627899169921875, -0.053165435791015625, -0.04354095458984375, -0.033916473388671875, -0.0242919921875, -0.014667510986328125, -0.00504302978515625, 0.004581451416015625, 0.0142059326171875, 0.023830413818359375, 0.03345489501953125, 0.043079376220703125, 0.052703857421875, 0.062328338623046875, 0.07195281982421875, 0.08157730102539062, 0.0912017822265625, 0.10082626342773438, 0.11045074462890625, 0.12007522583007812, 0.12969970703125, 0.13932418823242188, 0.14894866943359375, 0.15857315063476562, 0.1681976318359375, 0.17782211303710938, 0.18744659423828125, 0.19707107543945312, 0.206695556640625, 0.21632003784179688, 0.22594451904296875, 0.23556900024414062, 0.2451934814453125, 0.2548179626464844, 0.26444244384765625, 0.2740669250488281, 0.28369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 12.0, 12.0, 19.0, 18.0, 37.0, 41.0, 51.0, 55.0, 81.0, 99.0, 94.0, 81.0, 83.0, 71.0, 52.0, 48.0, 38.0, 18.0, 11.0, 15.0, 13.0, 6.0, 7.0, 4.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00237274169921875, -0.0022725462913513184, -0.0021723508834838867, -0.002072155475616455, -0.0019719600677490234, -0.0018717646598815918, -0.0017715692520141602, -0.0016713738441467285, -0.0015711784362792969, -0.0014709830284118652, -0.0013707876205444336, -0.001270592212677002, -0.0011703968048095703, -0.0010702013969421387, -0.000970005989074707, -0.0008698105812072754, -0.0007696151733398438, -0.0006694197654724121, -0.0005692243576049805, -0.00046902894973754883, -0.0003688335418701172, -0.00026863813400268555, -0.0001684427261352539, -6.824731826782227e-05, 3.1948089599609375e-05, 0.00013214349746704102, 0.00023233890533447266, 0.0003325343132019043, 0.00043272972106933594, 0.0005329251289367676, 0.0006331205368041992, 0.0007333159446716309, 0.0008335113525390625, 0.0009337067604064941, 0.0010339021682739258, 0.0011340975761413574, 0.001234292984008789, 0.0013344883918762207, 0.0014346837997436523, 0.001534879207611084, 0.0016350746154785156, 0.0017352700233459473, 0.001835465431213379, 0.0019356608390808105, 0.002035856246948242, 0.002136051654815674, 0.0022362470626831055, 0.002336442470550537, 0.0024366378784179688, 0.0025368332862854004, 0.002637028694152832, 0.0027372241020202637, 0.0028374195098876953, 0.002937614917755127, 0.0030378103256225586, 0.0031380057334899902, 0.003238201141357422, 0.0033383965492248535, 0.003438591957092285, 0.003538787364959717, 0.0036389827728271484, 0.00373917818069458, 0.0038393735885620117, 0.003939568996429443, 0.004039764404296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 6.0, 14.0, 35.0, 41.0, 34.0, 72.0, 101.0, 141.0, 260.0, 411.0, 1099.0, 904138.0, 140365.0, 791.0, 351.0, 246.0, 132.0, 88.0, 43.0, 45.0, 44.0, 20.0, 11.0, 11.0, 10.0, 7.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.08294677734375, -0.08091878890991211, -0.07889080047607422, -0.07686281204223633, -0.07483482360839844, -0.07280683517456055, -0.07077884674072266, -0.06875085830688477, -0.06672286987304688, -0.06469488143920898, -0.0626668930053711, -0.0606389045715332, -0.05861091613769531, -0.05658292770385742, -0.05455493927001953, -0.05252695083618164, -0.05049896240234375, -0.04847097396850586, -0.04644298553466797, -0.04441499710083008, -0.04238700866699219, -0.0403590202331543, -0.038331031799316406, -0.036303043365478516, -0.034275054931640625, -0.032247066497802734, -0.030219078063964844, -0.028191089630126953, -0.026163101196289062, -0.024135112762451172, -0.02210712432861328, -0.02007913589477539, -0.0180511474609375, -0.01602315902709961, -0.013995170593261719, -0.011967182159423828, -0.009939193725585938, -0.007911205291748047, -0.005883216857910156, -0.0038552284240722656, -0.001827239990234375, 0.00020074844360351562, 0.0022287368774414062, 0.004256725311279297, 0.0062847137451171875, 0.008312702178955078, 0.010340690612792969, 0.01236867904663086, 0.01439666748046875, 0.01642465591430664, 0.01845264434814453, 0.020480632781982422, 0.022508621215820312, 0.024536609649658203, 0.026564598083496094, 0.028592586517333984, 0.030620574951171875, 0.032648563385009766, 0.034676551818847656, 0.03670454025268555, 0.03873252868652344, 0.04076051712036133, 0.04278850555419922, 0.04481649398803711, 0.046844482421875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1008.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051476843655109406, -0.05020083114504814, -0.04892481863498688, -0.04764880612492561, -0.04637279361486435, -0.04509677737951279, -0.04382076486945152, -0.04254475235939026, -0.041268739849328995, -0.03999272733926773, -0.03871671482920647, -0.0374407023191452, -0.03616468608379364, -0.034888673573732376, -0.03361266106367111, -0.03233664855360985, -0.031060636043548584, -0.02978462353348732, -0.028508611023426056, -0.027232596650719643, -0.02595658414065838, -0.024680571630597115, -0.0234045572578907, -0.022128544747829437, -0.020852532237768173, -0.01957651972770691, -0.018300507217645645, -0.017024492844939232, -0.015748480334877968, -0.014472467824816704, -0.013196454383432865, -0.011920440942049026, -0.010644424706697464, -0.0093684121966362, -0.008092398755252361, -0.00681638577952981, -0.005540372803807259, -0.004264359828084707, -0.002988346852362156, -0.0017123334109783173, -0.0004363209009170532, 0.0008396920748054981, 0.0021157050505280495, 0.003391718026250601, 0.004667731001973152, 0.0059437439776957035, 0.007219756953418255, 0.008495770394802094, 0.009771782904863358, 0.011047795414924622, 0.01232380885630846, 0.013599822297692299, 0.014875834807753563, 0.016151847317814827, 0.01742786169052124, 0.018703874200582504, 0.01997988671064377, 0.021255899220705032, 0.022531911730766296, 0.02380792610347271, 0.025083938613533974, 0.026359951123595238, 0.02763596549630165, 0.028911978006362915, 0.03018799051642418]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 8.0, 12.0, 15.0, 20.0, 19.0, 32.0, 25.0, 44.0, 45.0, 57.0, 55.0, 51.0, 64.0, 71.0, 76.0, 81.0, 66.0, 52.0, 45.0, 36.0, 24.0, 30.0, 17.0, 29.0, 15.0, 7.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015898346900939941, -0.0015199529007077217, -0.0014500711113214493, -0.0013801893219351768, -0.0013103075325489044, -0.001240425743162632, -0.0011705439537763596, -0.0011006621643900871, -0.0010307803750038147, -0.0009608985856175423, -0.0008910167962312698, -0.0008211350068449974, -0.000751253217458725, -0.0006813714280724525, -0.0006114896386861801, -0.0005416078492999077, -0.00047172605991363525, -0.0004018442705273628, -0.0003319624811410904, -0.00026208069175481796, -0.00019219890236854553, -0.0001223171129822731, -5.243532359600067e-05, 1.744646579027176e-05, 8.732825517654419e-05, 0.00015721004456281662, 0.00022709183394908905, 0.0002969736233353615, 0.0003668554127216339, 0.00043673720210790634, 0.0005066189914941788, 0.0005765007808804512, 0.0006463825702667236, 0.0007162643596529961, 0.0007861461490392685, 0.0008560279384255409, 0.0009259097278118134, 0.0009957915171980858, 0.0010656733065843582, 0.0011355550959706306, 0.001205436885356903, 0.0012753186747431755, 0.001345200464129448, 0.0014150822535157204, 0.0014849640429019928, 0.0015548458322882652, 0.0016247276216745377, 0.00169460941106081, 0.0017644912004470825, 0.001834372989833355, 0.0019042547792196274, 0.0019741365686059, 0.0020440183579921722, 0.0021139001473784447, 0.002183781936764717, 0.0022536637261509895, 0.002323545515537262, 0.0023934273049235344, 0.002463309094309807, 0.0025331908836960793, 0.0026030726730823517, 0.002672954462468624, 0.0027428362518548965, 0.002812718041241169, 0.0028825998306274414]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 1.0, 9.0, 11.0, 10.0, 16.0, 14.0, 24.0, 17.0, 23.0, 28.0, 19.0, 28.0, 42.0, 39.0, 31.0, 42.0, 51.0, 46.0, 48.0, 47.0, 38.0, 44.0, 47.0, 45.0, 29.0, 38.0, 21.0, 28.0, 30.0, 29.0, 22.0, 13.0, 13.0, 12.0, 8.0, 15.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9215087890625, -3.780517578125, -3.6395263671875, -3.49853515625, -3.3575439453125, -3.216552734375, -3.0755615234375, -2.9345703125, -2.7935791015625, -2.652587890625, -2.5115966796875, -2.37060546875, -2.2296142578125, -2.088623046875, -1.9476318359375, -1.806640625, -1.6656494140625, -1.524658203125, -1.3836669921875, -1.24267578125, -1.1016845703125, -0.960693359375, -0.8197021484375, -0.6787109375, -0.5377197265625, -0.396728515625, -0.2557373046875, -0.11474609375, 0.0262451171875, 0.167236328125, 0.3082275390625, 0.44921875, 0.5902099609375, 0.731201171875, 0.8721923828125, 1.01318359375, 1.1541748046875, 1.295166015625, 1.4361572265625, 1.5771484375, 1.7181396484375, 1.859130859375, 2.0001220703125, 2.14111328125, 2.2821044921875, 2.423095703125, 2.5640869140625, 2.705078125, 2.8460693359375, 2.987060546875, 3.1280517578125, 3.26904296875, 3.4100341796875, 3.551025390625, 3.6920166015625, 3.8330078125, 3.9739990234375, 4.114990234375, 4.2559814453125, 4.39697265625, 4.5379638671875, 4.678955078125, 4.8199462890625, 4.9609375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 13.0, 21.0, 37.0, 43.0, 63.0, 109.0, 177.0, 330.0, 525.0, 966.0, 1787.0, 3128.0, 5823.0, 12117.0, 28929.0, 91019.0, 440442.0, 341067.0, 74438.0, 25067.0, 10568.0, 5298.0, 2769.0, 1603.0, 942.0, 530.0, 313.0, 179.0, 99.0, 57.0, 37.0, 20.0, 14.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-4.94140625, -4.817626953125, -4.69384765625, -4.570068359375, -4.4462890625, -4.322509765625, -4.19873046875, -4.074951171875, -3.951171875, -3.827392578125, -3.70361328125, -3.579833984375, -3.4560546875, -3.332275390625, -3.20849609375, -3.084716796875, -2.9609375, -2.837158203125, -2.71337890625, -2.589599609375, -2.4658203125, -2.342041015625, -2.21826171875, -2.094482421875, -1.970703125, -1.846923828125, -1.72314453125, -1.599365234375, -1.4755859375, -1.351806640625, -1.22802734375, -1.104248046875, -0.98046875, -0.856689453125, -0.73291015625, -0.609130859375, -0.4853515625, -0.361572265625, -0.23779296875, -0.114013671875, 0.009765625, 0.133544921875, 0.25732421875, 0.381103515625, 0.5048828125, 0.628662109375, 0.75244140625, 0.876220703125, 1.0, 1.123779296875, 1.24755859375, 1.371337890625, 1.4951171875, 1.618896484375, 1.74267578125, 1.866455078125, 1.990234375, 2.114013671875, 2.23779296875, 2.361572265625, 2.4853515625, 2.609130859375, 2.73291015625, 2.856689453125, 2.98046875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 7.0, 14.0, 13.0, 14.0, 16.0, 24.0, 25.0, 28.0, 43.0, 43.0, 44.0, 52.0, 61.0, 71.0, 306.0, 1725.0, 105.0, 57.0, 46.0, 48.0, 43.0, 39.0, 26.0, 29.0, 33.0, 30.0, 20.0, 20.0, 10.0, 15.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.58740234375, -16.0185546875, -15.44970703125, -14.880859375, -14.31201171875, -13.7431640625, -13.17431640625, -12.60546875, -12.03662109375, -11.4677734375, -10.89892578125, -10.330078125, -9.76123046875, -9.1923828125, -8.62353515625, -8.0546875, -7.48583984375, -6.9169921875, -6.34814453125, -5.779296875, -5.21044921875, -4.6416015625, -4.07275390625, -3.50390625, -2.93505859375, -2.3662109375, -1.79736328125, -1.228515625, -0.65966796875, -0.0908203125, 0.47802734375, 1.046875, 1.61572265625, 2.1845703125, 2.75341796875, 3.322265625, 3.89111328125, 4.4599609375, 5.02880859375, 5.59765625, 6.16650390625, 6.7353515625, 7.30419921875, 7.873046875, 8.44189453125, 9.0107421875, 9.57958984375, 10.1484375, 10.71728515625, 11.2861328125, 11.85498046875, 12.423828125, 12.99267578125, 13.5615234375, 14.13037109375, 14.69921875, 15.26806640625, 15.8369140625, 16.40576171875, 16.974609375, 17.54345703125, 18.1123046875, 18.68115234375, 19.25]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 11.0, 14.0, 22.0, 29.0, 29.0, 38.0, 40.0, 48.0, 72.0, 118.0, 176.0, 372.0, 1234.0, 11390.0, 2969667.0, 157545.0, 3473.0, 667.0, 269.0, 133.0, 73.0, 65.0, 40.0, 39.0, 29.0, 15.0, 14.0, 11.0, 16.0, 13.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.20458984375, -30.2529296875, -29.30126953125, -28.349609375, -27.39794921875, -26.4462890625, -25.49462890625, -24.54296875, -23.59130859375, -22.6396484375, -21.68798828125, -20.736328125, -19.78466796875, -18.8330078125, -17.88134765625, -16.9296875, -15.97802734375, -15.0263671875, -14.07470703125, -13.123046875, -12.17138671875, -11.2197265625, -10.26806640625, -9.31640625, -8.36474609375, -7.4130859375, -6.46142578125, -5.509765625, -4.55810546875, -3.6064453125, -2.65478515625, -1.703125, -0.75146484375, 0.2001953125, 1.15185546875, 2.103515625, 3.05517578125, 4.0068359375, 4.95849609375, 5.91015625, 6.86181640625, 7.8134765625, 8.76513671875, 9.716796875, 10.66845703125, 11.6201171875, 12.57177734375, 13.5234375, 14.47509765625, 15.4267578125, 16.37841796875, 17.330078125, 18.28173828125, 19.2333984375, 20.18505859375, 21.13671875, 22.08837890625, 23.0400390625, 23.99169921875, 24.943359375, 25.89501953125, 26.8466796875, 27.79833984375, 28.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [18.0, 218.0, 684.0, 92.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.627401351928711, -4.445851802825928, -1.2643022537231445, 1.9172477722167969, 5.098796844482422, 8.280345916748047, 11.461896896362305, 14.64344596862793, 17.824995040893555, 21.00654411315918, 24.188095092773438, 27.369644165039062, 30.551193237304688, 33.73274230957031, 36.91429138183594, 40.09584045410156, 43.27738952636719, 46.45893859863281, 49.64048767089844, 52.82203674316406, 56.00358581542969, 59.18513488769531, 62.3666877746582, 65.54823303222656, 68.72978973388672, 71.91133880615234, 75.09288787841797, 78.2744369506836, 81.45598602294922, 84.63753509521484, 87.819091796875, 91.00064086914062, 94.18218994140625, 97.36373901367188, 100.5452880859375, 103.72683715820312, 106.90838623046875, 110.08993530273438, 113.271484375, 116.45303344726562, 119.63458251953125, 122.81613159179688, 125.9976806640625, 129.17922973632812, 132.36077880859375, 135.54232788085938, 138.723876953125, 141.90542602539062, 145.08697509765625, 148.26852416992188, 151.4500732421875, 154.63162231445312, 157.81317138671875, 160.99472045898438, 164.17626953125, 167.35781860351562, 170.5393829345703, 173.72093200683594, 176.90248107910156, 180.0840301513672, 183.2655792236328, 186.44712829589844, 189.62867736816406, 192.8102264404297, 195.9917755126953]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 10.0, 5.0, 12.0, 9.0, 12.0, 20.0, 18.0, 22.0, 23.0, 18.0, 18.0, 20.0, 27.0, 27.0, 36.0, 34.0, 39.0, 38.0, 46.0, 31.0, 35.0, 45.0, 39.0, 46.0, 38.0, 36.0, 33.0, 26.0, 40.0, 24.0, 21.0, 19.0, 22.0, 17.0, 13.0, 20.0, 20.0, 13.0, 4.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-50.74734115600586, -49.18922424316406, -47.631107330322266, -46.07299041748047, -44.51487350463867, -42.956756591796875, -41.39863967895508, -39.84052276611328, -38.282405853271484, -36.72428894042969, -35.16617202758789, -33.608055114746094, -32.0499382019043, -30.4918212890625, -28.933704376220703, -27.375587463378906, -25.817468643188477, -24.25935173034668, -22.701234817504883, -21.143117904663086, -19.58500099182129, -18.026884078979492, -16.468765258789062, -14.910649299621582, -13.352532386779785, -11.794415473937988, -10.236298561096191, -8.678180694580078, -7.1200642585754395, -5.561947345733643, -4.0038299560546875, -2.4457130432128906, -0.8875961303710938, 0.6705209016799927, 2.228637933731079, 3.786755084991455, 5.344871997833252, 6.902988910675049, 8.461106300354004, 10.0192232131958, 11.577340126037598, 13.135457038879395, 14.693573951721191, 16.251691818237305, 17.8098087310791, 19.3679256439209, 20.926042556762695, 22.484159469604492, 24.04227638244629, 25.600393295288086, 27.158510208129883, 28.71662712097168, 30.274744033813477, 31.832860946655273, 33.3909797668457, 34.9490966796875, 36.5072135925293, 38.065330505371094, 39.62344741821289, 41.18156433105469, 42.739681243896484, 44.29779815673828, 45.85591506958008, 47.414031982421875, 48.97214889526367]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 4.0, 11.0, 14.0, 17.0, 17.0, 23.0, 28.0, 22.0, 27.0, 35.0, 39.0, 40.0, 30.0, 52.0, 42.0, 49.0, 48.0, 44.0, 38.0, 52.0, 35.0, 47.0, 30.0, 33.0, 24.0, 40.0, 26.0, 24.0, 12.0, 10.0, 15.0, 14.0, 7.0, 9.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.17340087890625, -4.0264892578125, -3.87957763671875, -3.732666015625, -3.58575439453125, -3.4388427734375, -3.29193115234375, -3.14501953125, -2.99810791015625, -2.8511962890625, -2.70428466796875, -2.557373046875, -2.41046142578125, -2.2635498046875, -2.11663818359375, -1.9697265625, -1.82281494140625, -1.6759033203125, -1.52899169921875, -1.382080078125, -1.23516845703125, -1.0882568359375, -0.94134521484375, -0.79443359375, -0.64752197265625, -0.5006103515625, -0.35369873046875, -0.206787109375, -0.05987548828125, 0.0870361328125, 0.23394775390625, 0.380859375, 0.52777099609375, 0.6746826171875, 0.82159423828125, 0.968505859375, 1.11541748046875, 1.2623291015625, 1.40924072265625, 1.55615234375, 1.70306396484375, 1.8499755859375, 1.99688720703125, 2.143798828125, 2.29071044921875, 2.4376220703125, 2.58453369140625, 2.7314453125, 2.87835693359375, 3.0252685546875, 3.17218017578125, 3.319091796875, 3.46600341796875, 3.6129150390625, 3.75982666015625, 3.90673828125, 4.05364990234375, 4.2005615234375, 4.34747314453125, 4.494384765625, 4.64129638671875, 4.7882080078125, 4.93511962890625, 5.08203125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 7.0, 10.0, 15.0, 8.0, 26.0, 19.0, 28.0, 28.0, 43.0, 42.0, 55.0, 91.0, 212.0, 1000.0, 8653.0, 242223.0, 3808525.0, 126582.0, 5577.0, 649.0, 141.0, 75.0, 43.0, 40.0, 31.0, 24.0, 25.0, 24.0, 17.0, 17.0, 6.0, 10.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.80322265625, -22.9658203125, -22.12841796875, -21.291015625, -20.45361328125, -19.6162109375, -18.77880859375, -17.94140625, -17.10400390625, -16.2666015625, -15.42919921875, -14.591796875, -13.75439453125, -12.9169921875, -12.07958984375, -11.2421875, -10.40478515625, -9.5673828125, -8.72998046875, -7.892578125, -7.05517578125, -6.2177734375, -5.38037109375, -4.54296875, -3.70556640625, -2.8681640625, -2.03076171875, -1.193359375, -0.35595703125, 0.4814453125, 1.31884765625, 2.15625, 2.99365234375, 3.8310546875, 4.66845703125, 5.505859375, 6.34326171875, 7.1806640625, 8.01806640625, 8.85546875, 9.69287109375, 10.5302734375, 11.36767578125, 12.205078125, 13.04248046875, 13.8798828125, 14.71728515625, 15.5546875, 16.39208984375, 17.2294921875, 18.06689453125, 18.904296875, 19.74169921875, 20.5791015625, 21.41650390625, 22.25390625, 23.09130859375, 23.9287109375, 24.76611328125, 25.603515625, 26.44091796875, 27.2783203125, 28.11572265625, 28.953125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 6.0, 11.0, 8.0, 22.0, 45.0, 66.0, 83.0, 116.0, 202.0, 207.0, 329.0, 476.0, 573.0, 552.0, 447.0, 304.0, 210.0, 144.0, 86.0, 57.0, 40.0, 23.0, 15.0, 14.0, 10.0, 5.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.802001953125, -20.29150390625, -19.781005859375, -19.2705078125, -18.760009765625, -18.24951171875, -17.739013671875, -17.228515625, -16.718017578125, -16.20751953125, -15.697021484375, -15.1865234375, -14.676025390625, -14.16552734375, -13.655029296875, -13.14453125, -12.634033203125, -12.12353515625, -11.613037109375, -11.1025390625, -10.592041015625, -10.08154296875, -9.571044921875, -9.060546875, -8.550048828125, -8.03955078125, -7.529052734375, -7.0185546875, -6.508056640625, -5.99755859375, -5.487060546875, -4.9765625, -4.466064453125, -3.95556640625, -3.445068359375, -2.9345703125, -2.424072265625, -1.91357421875, -1.403076171875, -0.892578125, -0.382080078125, 0.12841796875, 0.638916015625, 1.1494140625, 1.659912109375, 2.17041015625, 2.680908203125, 3.19140625, 3.701904296875, 4.21240234375, 4.722900390625, 5.2333984375, 5.743896484375, 6.25439453125, 6.764892578125, 7.275390625, 7.785888671875, 8.29638671875, 8.806884765625, 9.3173828125, 9.827880859375, 10.33837890625, 10.848876953125, 11.359375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 7.0, 0.0, 16.0, 9.0, 27.0, 39.0, 70.0, 88.0, 183.0, 359.0, 1026.0, 10520.0, 1109813.0, 3051089.0, 18770.0, 1358.0, 392.0, 197.0, 133.0, 68.0, 44.0, 37.0, 16.0, 14.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.296875, -23.501220703125, -21.70556640625, -19.909912109375, -18.1142578125, -16.318603515625, -14.52294921875, -12.727294921875, -10.931640625, -9.135986328125, -7.34033203125, -5.544677734375, -3.7490234375, -1.953369140625, -0.15771484375, 1.637939453125, 3.43359375, 5.229248046875, 7.02490234375, 8.820556640625, 10.6162109375, 12.411865234375, 14.20751953125, 16.003173828125, 17.798828125, 19.594482421875, 21.39013671875, 23.185791015625, 24.9814453125, 26.777099609375, 28.57275390625, 30.368408203125, 32.1640625, 33.959716796875, 35.75537109375, 37.551025390625, 39.3466796875, 41.142333984375, 42.93798828125, 44.733642578125, 46.529296875, 48.324951171875, 50.12060546875, 51.916259765625, 53.7119140625, 55.507568359375, 57.30322265625, 59.098876953125, 60.89453125, 62.690185546875, 64.48583984375, 66.281494140625, 68.0771484375, 69.872802734375, 71.66845703125, 73.464111328125, 75.259765625, 77.055419921875, 78.85107421875, 80.646728515625, 82.4423828125, 84.238037109375, 86.03369140625, 87.829345703125, 89.625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 15.0, 48.0, 80.0, 145.0, 229.0, 213.0, 149.0, 61.0, 36.0, 20.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.05523681640625, -156.84902954101562, -153.642822265625, -150.4365997314453, -147.2303924560547, -144.02418518066406, -140.81796264648438, -137.61175537109375, -134.40554809570312, -131.1993408203125, -127.99312591552734, -124.78691101074219, -121.58070373535156, -118.37449645996094, -115.16828155517578, -111.96206665039062, -108.755859375, -105.54965209960938, -102.34343719482422, -99.13722229003906, -95.93101501464844, -92.72480773925781, -89.51859283447266, -86.3123779296875, -83.10617065429688, -79.89996337890625, -76.6937484741211, -73.48753356933594, -70.28132629394531, -67.07511901855469, -63.86890411376953, -60.66269302368164, -57.45648956298828, -54.25027847290039, -51.0440673828125, -47.83785629272461, -44.63164520263672, -41.42543411254883, -38.21922302246094, -35.01301193237305, -31.806800842285156, -28.600589752197266, -25.394378662109375, -22.188167572021484, -18.981956481933594, -15.775745391845703, -12.569534301757812, -9.363323211669922, -6.157112121582031, -2.9509010314941406, 0.25531005859375, 3.4615211486816406, 6.667732238769531, 9.873943328857422, 13.080154418945312, 16.286365509033203, 19.492576599121094, 22.698787689208984, 25.904998779296875, 29.111209869384766, 32.317420959472656, 35.52363204956055, 38.72984313964844, 41.93605422973633, 45.14226531982422]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 14.0, 18.0, 18.0, 32.0, 26.0, 16.0, 44.0, 25.0, 35.0, 34.0, 32.0, 34.0, 38.0, 44.0, 44.0, 37.0, 29.0, 38.0, 42.0, 39.0, 34.0, 19.0, 35.0, 29.0, 33.0, 20.0, 28.0, 20.0, 23.0, 6.0, 12.0, 10.0, 12.0, 15.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-42.816436767578125, -41.521385192871094, -40.22633743286133, -38.9312858581543, -37.63623809814453, -36.3411865234375, -35.04613494873047, -33.75108337402344, -32.45603561401367, -31.160985946655273, -29.865936279296875, -28.570884704589844, -27.275835037231445, -25.980785369873047, -24.685733795166016, -23.390684127807617, -22.09563446044922, -20.80058479309082, -19.505535125732422, -18.21048355102539, -16.915433883666992, -15.620384216308594, -14.325333595275879, -13.030282974243164, -11.735233306884766, -10.440183639526367, -9.145133018493652, -7.850082874298096, -6.555032730102539, -5.259982585906982, -3.964932441711426, -2.669881820678711, -1.3748321533203125, -0.07978200912475586, 1.2152681350708008, 2.5103182792663574, 3.805368423461914, 5.100418567657471, 6.395468711853027, 7.690519332885742, 8.98556900024414, 10.280618667602539, 11.575669288635254, 12.870719909667969, 14.165769577026367, 15.460819244384766, 16.755870819091797, 18.050920486450195, 19.345970153808594, 20.641019821166992, 21.93606948852539, 23.231121063232422, 24.52617073059082, 25.82122039794922, 27.11627197265625, 28.41132164001465, 29.706371307373047, 31.001420974731445, 32.296470642089844, 33.591522216796875, 34.886573791503906, 36.18162155151367, 37.4766731262207, 38.77172088623047, 40.0667724609375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 9.0, 7.0, 4.0, 21.0, 29.0, 53.0, 53.0, 72.0, 130.0, 175.0, 252.0, 346.0, 519.0, 815.0, 1139.0, 1628.0, 2554.0, 3779.0, 5670.0, 8623.0, 13245.0, 20505.0, 32040.0, 50265.0, 80100.0, 123032.0, 169697.0, 172929.0, 127988.0, 84170.0, 52745.0, 33635.0, 21554.0, 13888.0, 8875.0, 5919.0, 3922.0, 2610.0, 1747.0, 1201.0, 825.0, 558.0, 375.0, 286.0, 170.0, 138.0, 88.0, 63.0, 40.0, 24.0, 16.0, 12.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.419677734375, -0.4061622619628906, -0.39264678955078125, -0.3791313171386719, -0.3656158447265625, -0.3521003723144531, -0.33858489990234375, -0.3250694274902344, -0.311553955078125, -0.2980384826660156, -0.28452301025390625, -0.2710075378417969, -0.2574920654296875, -0.24397659301757812, -0.23046112060546875, -0.21694564819335938, -0.20343017578125, -0.18991470336914062, -0.17639923095703125, -0.16288375854492188, -0.1493682861328125, -0.13585281372070312, -0.12233734130859375, -0.10882186889648438, -0.095306396484375, -0.08179092407226562, -0.06827545166015625, -0.054759979248046875, -0.0412445068359375, -0.027729034423828125, -0.01421356201171875, -0.000698089599609375, 0.0128173828125, 0.026332855224609375, 0.03984832763671875, 0.053363800048828125, 0.0668792724609375, 0.08039474487304688, 0.09391021728515625, 0.10742568969726562, 0.120941162109375, 0.13445663452148438, 0.14797210693359375, 0.16148757934570312, 0.1750030517578125, 0.18851852416992188, 0.20203399658203125, 0.21554946899414062, 0.22906494140625, 0.24258041381835938, 0.25609588623046875, 0.2696113586425781, 0.2831268310546875, 0.2966423034667969, 0.31015777587890625, 0.3236732482910156, 0.337188720703125, 0.3507041931152344, 0.36421966552734375, 0.3777351379394531, 0.3912506103515625, 0.4047660827636719, 0.41828155517578125, 0.4317970275878906, 0.4453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 13.0, 15.0, 13.0, 22.0, 18.0, 21.0, 26.0, 32.0, 33.0, 33.0, 38.0, 29.0, 35.0, 47.0, 38.0, 47.0, 1063.0, 39.0, 45.0, 38.0, 33.0, 37.0, 44.0, 39.0, 31.0, 25.0, 20.0, 23.0, 19.0, 17.0, 10.0, 16.0, 8.0, 8.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.59228515625, -2.5009765625, -2.40966796875, -2.318359375, -2.22705078125, -2.1357421875, -2.04443359375, -1.953125, -1.86181640625, -1.7705078125, -1.67919921875, -1.587890625, -1.49658203125, -1.4052734375, -1.31396484375, -1.22265625, -1.13134765625, -1.0400390625, -0.94873046875, -0.857421875, -0.76611328125, -0.6748046875, -0.58349609375, -0.4921875, -0.40087890625, -0.3095703125, -0.21826171875, -0.126953125, -0.03564453125, 0.0556640625, 0.14697265625, 0.23828125, 0.32958984375, 0.4208984375, 0.51220703125, 0.603515625, 0.69482421875, 0.7861328125, 0.87744140625, 0.96875, 1.06005859375, 1.1513671875, 1.24267578125, 1.333984375, 1.42529296875, 1.5166015625, 1.60791015625, 1.69921875, 1.79052734375, 1.8818359375, 1.97314453125, 2.064453125, 2.15576171875, 2.2470703125, 2.33837890625, 2.4296875, 2.52099609375, 2.6123046875, 2.70361328125, 2.794921875, 2.88623046875, 2.9775390625, 3.06884765625, 3.16015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 10.0, 11.0, 16.0, 32.0, 60.0, 93.0, 149.0, 220.0, 444.0, 741.0, 1259.0, 2210.0, 3875.0, 6876.0, 11823.0, 20662.0, 35539.0, 60717.0, 100157.0, 152237.0, 1236607.0, 170079.0, 118305.0, 72792.0, 42961.0, 25182.0, 14531.0, 8331.0, 4729.0, 2736.0, 1624.0, 896.0, 495.0, 324.0, 160.0, 113.0, 58.0, 30.0, 18.0, 13.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.430908203125, -0.41883087158203125, -0.4067535400390625, -0.39467620849609375, -0.382598876953125, -0.37052154541015625, -0.3584442138671875, -0.34636688232421875, -0.33428955078125, -0.32221221923828125, -0.3101348876953125, -0.29805755615234375, -0.285980224609375, -0.27390289306640625, -0.2618255615234375, -0.24974822998046875, -0.2376708984375, -0.22559356689453125, -0.2135162353515625, -0.20143890380859375, -0.189361572265625, -0.17728424072265625, -0.1652069091796875, -0.15312957763671875, -0.14105224609375, -0.12897491455078125, -0.1168975830078125, -0.10482025146484375, -0.092742919921875, -0.08066558837890625, -0.0685882568359375, -0.05651092529296875, -0.04443359375, -0.03235626220703125, -0.0202789306640625, -0.00820159912109375, 0.003875732421875, 0.01595306396484375, 0.0280303955078125, 0.04010772705078125, 0.05218505859375, 0.06426239013671875, 0.0763397216796875, 0.08841705322265625, 0.100494384765625, 0.11257171630859375, 0.1246490478515625, 0.13672637939453125, 0.1488037109375, 0.16088104248046875, 0.1729583740234375, 0.18503570556640625, 0.197113037109375, 0.20919036865234375, 0.2212677001953125, 0.23334503173828125, 0.24542236328125, 0.25749969482421875, 0.2695770263671875, 0.28165435791015625, 0.293731689453125, 0.30580902099609375, 0.3178863525390625, 0.32996368408203125, 0.342041015625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 3.0, 5.0, 10.0, 14.0, 17.0, 10.0, 18.0, 16.0, 14.0, 23.0, 41.0, 48.0, 51.0, 56.0, 58.0, 69.0, 67.0, 66.0, 72.0, 67.0, 43.0, 46.0, 41.0, 35.0, 20.0, 22.0, 15.0, 8.0, 14.0, 6.0, 1.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036411285400390625, -0.0035358965396881104, -0.003430664539337158, -0.003325432538986206, -0.003220200538635254, -0.0031149685382843018, -0.0030097365379333496, -0.0029045045375823975, -0.0027992725372314453, -0.002694040536880493, -0.002588808536529541, -0.002483576536178589, -0.0023783445358276367, -0.0022731125354766846, -0.0021678805351257324, -0.0020626485347747803, -0.001957416534423828, -0.001852184534072876, -0.0017469525337219238, -0.0016417205333709717, -0.0015364885330200195, -0.0014312565326690674, -0.0013260245323181152, -0.001220792531967163, -0.001115560531616211, -0.0010103285312652588, -0.0009050965309143066, -0.0007998645305633545, -0.0006946325302124023, -0.0005894005298614502, -0.00048416852951049805, -0.0003789365291595459, -0.00027370452880859375, -0.0001684725284576416, -6.324052810668945e-05, 4.1991472244262695e-05, 0.00014722347259521484, 0.000252455472946167, 0.00035768747329711914, 0.0004629194736480713, 0.0005681514739990234, 0.0006733834743499756, 0.0007786154747009277, 0.0008838474750518799, 0.000989079475402832, 0.0010943114757537842, 0.0011995434761047363, 0.0013047754764556885, 0.0014100074768066406, 0.0015152394771575928, 0.001620471477508545, 0.001725703477859497, 0.0018309354782104492, 0.0019361674785614014, 0.0020413994789123535, 0.0021466314792633057, 0.002251863479614258, 0.00235709547996521, 0.002462327480316162, 0.0025675594806671143, 0.0026727914810180664, 0.0027780234813690186, 0.0028832554817199707, 0.002988487482070923, 0.003093719482421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 18.0, 30.0, 39.0, 44.0, 57.0, 71.0, 81.0, 84.0, 143.0, 204.0, 391.0, 770.0, 17784.0, 1021439.0, 5634.0, 619.0, 292.0, 227.0, 152.0, 103.0, 81.0, 55.0, 49.0, 36.0, 21.0, 25.0, 9.0, 14.0, 10.0, 4.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.058502197265625, -0.05663871765136719, -0.054775238037109375, -0.05291175842285156, -0.05104827880859375, -0.04918479919433594, -0.047321319580078125, -0.04545783996582031, -0.0435943603515625, -0.04173088073730469, -0.039867401123046875, -0.03800392150878906, -0.03614044189453125, -0.03427696228027344, -0.032413482666015625, -0.030550003051757812, -0.0286865234375, -0.026823043823242188, -0.024959564208984375, -0.023096084594726562, -0.02123260498046875, -0.019369125366210938, -0.017505645751953125, -0.015642166137695312, -0.0137786865234375, -0.011915206909179688, -0.010051727294921875, -0.008188247680664062, -0.00632476806640625, -0.0044612884521484375, -0.002597808837890625, -0.0007343292236328125, 0.001129150390625, 0.0029926300048828125, 0.004856109619140625, 0.0067195892333984375, 0.00858306884765625, 0.010446548461914062, 0.012310028076171875, 0.014173507690429688, 0.0160369873046875, 0.017900466918945312, 0.019763946533203125, 0.021627426147460938, 0.02349090576171875, 0.025354385375976562, 0.027217864990234375, 0.029081344604492188, 0.03094482421875, 0.03280830383300781, 0.034671783447265625, 0.03653526306152344, 0.03839874267578125, 0.04026222229003906, 0.042125701904296875, 0.04398918151855469, 0.0458526611328125, 0.04771614074707031, 0.049579620361328125, 0.05144309997558594, 0.05330657958984375, 0.05517005920410156, 0.057033538818359375, 0.05889701843261719, 0.060760498046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1005.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037998151034116745, -0.036793846637010574, -0.035589538514614105, -0.034385234117507935, -0.033180929720401764, -0.03197662532329559, -0.030772319063544273, -0.029568012803792953, -0.028363708406686783, -0.027159404009580612, -0.025955097749829292, -0.024750791490077972, -0.023546487092971802, -0.02234218269586563, -0.02113787643611431, -0.01993357017636299, -0.01872926577925682, -0.01752496138215065, -0.01632065512239933, -0.015116349793970585, -0.01391204446554184, -0.012707739137113094, -0.011503433808684349, -0.010299128480255604, -0.009094823151826859, -0.007890517823398113, -0.006686212494969368, -0.005481907166540623, -0.0042776018381118774, -0.003073296509683132, -0.001868991181254387, -0.0006646858528256416, 0.0005396232008934021, 0.0017439285293221474, 0.0029482338577508926, 0.004152539186179638, 0.005356844514608383, 0.0065611498430371284, 0.007765455171465874, 0.008969760499894619, 0.010174065828323364, 0.01137837115675211, 0.012582676485180855, 0.0137869818136096, 0.014991287142038345, 0.016195591539144516, 0.017399897798895836, 0.018604204058647156, 0.019808508455753326, 0.021012812852859497, 0.022217119112610817, 0.023421425372362137, 0.024625729769468307, 0.025830034166574478, 0.027034340426325798, 0.028238646686077118, 0.02944295108318329, 0.03064725548028946, 0.03185155987739563, 0.0330558679997921, 0.03426017239689827, 0.03546447679400444, 0.03666878491640091, 0.03787308931350708, 0.03907739371061325]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 8.0, 7.0, 14.0, 18.0, 12.0, 32.0, 23.0, 26.0, 32.0, 35.0, 51.0, 58.0, 44.0, 44.0, 62.0, 52.0, 52.0, 63.0, 47.0, 64.0, 41.0, 39.0, 32.0, 22.0, 22.0, 28.0, 16.0, 21.0, 4.0, 13.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018758773803710938, -0.001799331046640873, -0.0017227847129106522, -0.0016462383791804314, -0.0015696920454502106, -0.0014931457117199898, -0.001416599377989769, -0.0013400530442595482, -0.0012635067105293274, -0.0011869603767991066, -0.0011104140430688858, -0.001033867709338665, -0.0009573213756084442, -0.0008807750418782234, -0.0008042287081480026, -0.0007276823744177818, -0.000651136040687561, -0.0005745897069573402, -0.0004980433732271194, -0.00042149703949689865, -0.00034495070576667786, -0.00026840437203645706, -0.00019185803830623627, -0.00011531170457601547, -3.876537084579468e-05, 3.778096288442612e-05, 0.00011432729661464691, 0.0001908736303448677, 0.0002674199640750885, 0.0003439662978053093, 0.0004205126315355301, 0.0004970589652657509, 0.0005736052989959717, 0.0006501516327261925, 0.0007266979664564133, 0.0008032443001866341, 0.0008797906339168549, 0.0009563369676470757, 0.0010328833013772964, 0.0011094296351075172, 0.001185975968837738, 0.0012625223025679588, 0.0013390686362981796, 0.0014156149700284004, 0.0014921613037586212, 0.001568707637488842, 0.0016452539712190628, 0.0017218003049492836, 0.0017983466386795044, 0.0018748929724097252, 0.001951439306139946, 0.0020279856398701668, 0.0021045319736003876, 0.0021810783073306084, 0.002257624641060829, 0.00233417097479105, 0.0024107173085212708, 0.0024872636422514915, 0.0025638099759817123, 0.002640356309711933, 0.002716902643442154, 0.0027934489771723747, 0.0028699953109025955, 0.0029465416446328163, 0.003023087978363037]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 16.0, 15.0, 16.0, 18.0, 16.0, 32.0, 32.0, 38.0, 41.0, 30.0, 34.0, 42.0, 34.0, 44.0, 46.0, 52.0, 34.0, 49.0, 45.0, 34.0, 34.0, 41.0, 24.0, 26.0, 32.0, 22.0, 17.0, 14.0, 16.0, 15.0, 14.0, 9.0, 10.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.51409912109375, -4.3680419921875, -4.22198486328125, -4.075927734375, -3.92987060546875, -3.7838134765625, -3.63775634765625, -3.49169921875, -3.34564208984375, -3.1995849609375, -3.05352783203125, -2.907470703125, -2.76141357421875, -2.6153564453125, -2.46929931640625, -2.3232421875, -2.17718505859375, -2.0311279296875, -1.88507080078125, -1.739013671875, -1.59295654296875, -1.4468994140625, -1.30084228515625, -1.15478515625, -1.00872802734375, -0.8626708984375, -0.71661376953125, -0.570556640625, -0.42449951171875, -0.2784423828125, -0.13238525390625, 0.013671875, 0.15972900390625, 0.3057861328125, 0.45184326171875, 0.597900390625, 0.74395751953125, 0.8900146484375, 1.03607177734375, 1.18212890625, 1.32818603515625, 1.4742431640625, 1.62030029296875, 1.766357421875, 1.91241455078125, 2.0584716796875, 2.20452880859375, 2.3505859375, 2.49664306640625, 2.6427001953125, 2.78875732421875, 2.934814453125, 3.08087158203125, 3.2269287109375, 3.37298583984375, 3.51904296875, 3.66510009765625, 3.8111572265625, 3.95721435546875, 4.103271484375, 4.24932861328125, 4.3953857421875, 4.54144287109375, 4.6875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 19.0, 26.0, 21.0, 42.0, 72.0, 92.0, 119.0, 163.0, 315.0, 436.0, 793.0, 1325.0, 2596.0, 5159.0, 10176.0, 23638.0, 66454.0, 252070.0, 480102.0, 133026.0, 40169.0, 15739.0, 7454.0, 3741.0, 1938.0, 1057.0, 622.0, 398.0, 244.0, 136.0, 115.0, 91.0, 53.0, 36.0, 31.0, 20.0, 18.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.390625, -3.288726806640625, -3.18682861328125, -3.084930419921875, -2.9830322265625, -2.881134033203125, -2.77923583984375, -2.677337646484375, -2.575439453125, -2.473541259765625, -2.37164306640625, -2.269744873046875, -2.1678466796875, -2.065948486328125, -1.96405029296875, -1.862152099609375, -1.76025390625, -1.658355712890625, -1.55645751953125, -1.454559326171875, -1.3526611328125, -1.250762939453125, -1.14886474609375, -1.046966552734375, -0.945068359375, -0.843170166015625, -0.74127197265625, -0.639373779296875, -0.5374755859375, -0.435577392578125, -0.33367919921875, -0.231781005859375, -0.1298828125, -0.027984619140625, 0.07391357421875, 0.175811767578125, 0.2777099609375, 0.379608154296875, 0.48150634765625, 0.583404541015625, 0.685302734375, 0.787200927734375, 0.88909912109375, 0.990997314453125, 1.0928955078125, 1.194793701171875, 1.29669189453125, 1.398590087890625, 1.50048828125, 1.602386474609375, 1.70428466796875, 1.806182861328125, 1.9080810546875, 2.009979248046875, 2.11187744140625, 2.213775634765625, 2.315673828125, 2.417572021484375, 2.51947021484375, 2.621368408203125, 2.7232666015625, 2.825164794921875, 2.92706298828125, 3.028961181640625, 3.130859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 6.0, 19.0, 17.0, 16.0, 24.0, 23.0, 25.0, 37.0, 28.0, 32.0, 45.0, 46.0, 44.0, 64.0, 77.0, 1697.0, 313.0, 75.0, 62.0, 50.0, 53.0, 49.0, 37.0, 33.0, 29.0, 26.0, 22.0, 22.0, 12.0, 15.0, 10.0, 10.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.34375, -17.8177490234375, -17.291748046875, -16.7657470703125, -16.23974609375, -15.7137451171875, -15.187744140625, -14.6617431640625, -14.1357421875, -13.6097412109375, -13.083740234375, -12.5577392578125, -12.03173828125, -11.5057373046875, -10.979736328125, -10.4537353515625, -9.927734375, -9.4017333984375, -8.875732421875, -8.3497314453125, -7.82373046875, -7.2977294921875, -6.771728515625, -6.2457275390625, -5.7197265625, -5.1937255859375, -4.667724609375, -4.1417236328125, -3.61572265625, -3.0897216796875, -2.563720703125, -2.0377197265625, -1.51171875, -0.9857177734375, -0.459716796875, 0.0662841796875, 0.59228515625, 1.1182861328125, 1.644287109375, 2.1702880859375, 2.6962890625, 3.2222900390625, 3.748291015625, 4.2742919921875, 4.80029296875, 5.3262939453125, 5.852294921875, 6.3782958984375, 6.904296875, 7.4302978515625, 7.956298828125, 8.4822998046875, 9.00830078125, 9.5343017578125, 10.060302734375, 10.5863037109375, 11.1123046875, 11.6383056640625, 12.164306640625, 12.6903076171875, 13.21630859375, 13.7423095703125, 14.268310546875, 14.7943115234375, 15.3203125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 12.0, 13.0, 8.0, 5.0, 15.0, 25.0, 18.0, 29.0, 36.0, 33.0, 52.0, 95.0, 114.0, 191.0, 376.0, 934.0, 3434.0, 76101.0, 3043765.0, 16947.0, 2014.0, 640.0, 267.0, 156.0, 111.0, 56.0, 41.0, 50.0, 24.0, 26.0, 24.0, 20.0, 18.0, 13.0, 13.0, 2.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.914306640625, -23.12548828125, -22.336669921875, -21.5478515625, -20.759033203125, -19.97021484375, -19.181396484375, -18.392578125, -17.603759765625, -16.81494140625, -16.026123046875, -15.2373046875, -14.448486328125, -13.65966796875, -12.870849609375, -12.08203125, -11.293212890625, -10.50439453125, -9.715576171875, -8.9267578125, -8.137939453125, -7.34912109375, -6.560302734375, -5.771484375, -4.982666015625, -4.19384765625, -3.405029296875, -2.6162109375, -1.827392578125, -1.03857421875, -0.249755859375, 0.5390625, 1.327880859375, 2.11669921875, 2.905517578125, 3.6943359375, 4.483154296875, 5.27197265625, 6.060791015625, 6.849609375, 7.638427734375, 8.42724609375, 9.216064453125, 10.0048828125, 10.793701171875, 11.58251953125, 12.371337890625, 13.16015625, 13.948974609375, 14.73779296875, 15.526611328125, 16.3154296875, 17.104248046875, 17.89306640625, 18.681884765625, 19.470703125, 20.259521484375, 21.04833984375, 21.837158203125, 22.6259765625, 23.414794921875, 24.20361328125, 24.992431640625, 25.78125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 126.0, 715.0, 159.0, 8.0], "bins": [-174.2695770263672, -171.43614196777344, -168.60269165039062, -165.76925659179688, -162.93580627441406, -160.1023712158203, -157.2689208984375, -154.43548583984375, -151.60205078125, -148.76861572265625, -145.93516540527344, -143.1017303466797, -140.26828002929688, -137.43484497070312, -134.60140991210938, -131.76795959472656, -128.93450927734375, -126.10106658935547, -123.26762390136719, -120.43418884277344, -117.60074615478516, -114.76730346679688, -111.9338607788086, -109.10041809082031, -106.26698303222656, -103.43354034423828, -100.60009765625, -97.76666259765625, -94.93321990966797, -92.09977722167969, -89.2663345336914, -86.43289184570312, -83.59944915771484, -80.76600646972656, -77.93256378173828, -75.09912109375, -72.26568603515625, -69.43224334716797, -66.59880065917969, -63.765357971191406, -60.93191909790039, -58.09847640991211, -55.265037536621094, -52.43159484863281, -49.59815216064453, -46.76470947265625, -43.931270599365234, -41.09782791137695, -38.26438903808594, -35.430946350097656, -32.59750747680664, -29.76406478881836, -26.930622100830078, -24.09718132019043, -21.26374053955078, -18.4302978515625, -15.596856117248535, -12.76341438293457, -9.929973602294922, -7.096531867980957, -4.263090133666992, -1.4296483993530273, 1.403792381286621, 4.237235069274902, 7.070675849914551]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 8.0, 9.0, 12.0, 22.0, 20.0, 26.0, 17.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 28.0, 27.0, 38.0, 31.0, 40.0, 31.0, 46.0, 38.0, 40.0, 33.0, 33.0, 34.0, 25.0, 32.0, 20.0, 19.0, 19.0, 20.0, 21.0, 17.0, 12.0, 20.0, 19.0, 11.0, 10.0, 11.0, 12.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-44.84918212890625, -43.43840789794922, -42.02763748168945, -40.61686325073242, -39.206092834472656, -37.795318603515625, -36.384544372558594, -34.97377014160156, -33.5629997253418, -32.152225494384766, -30.741455078125, -29.33068084716797, -27.91990852355957, -26.509136199951172, -25.09836196899414, -23.687589645385742, -22.276817321777344, -20.866044998168945, -19.455272674560547, -18.044498443603516, -16.633726119995117, -15.222953796386719, -13.812180519104004, -12.401407241821289, -10.99063491821289, -9.579862594604492, -8.169089317321777, -6.758316516876221, -5.347543716430664, -3.9367709159851074, -2.525998115539551, -1.115224838256836, 0.2955513000488281, 1.7063241004943848, 3.1170969009399414, 4.527869701385498, 5.938642501831055, 7.349415302276611, 8.760188102722168, 10.170961380004883, 11.581733703613281, 12.99250602722168, 14.403279304504395, 15.81405258178711, 17.224824905395508, 18.635597229003906, 20.046371459960938, 21.457143783569336, 22.867916107177734, 24.278688430786133, 25.68946075439453, 27.100234985351562, 28.51100730895996, 29.92177963256836, 31.33255386352539, 32.743324279785156, 34.15409851074219, 35.56487274169922, 36.975643157958984, 38.386417388916016, 39.79718780517578, 41.20796203613281, 42.618736267089844, 44.029510498046875, 45.44028091430664]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 13.0, 10.0, 7.0, 17.0, 19.0, 12.0, 22.0, 32.0, 21.0, 36.0, 42.0, 31.0, 35.0, 40.0, 45.0, 41.0, 34.0, 47.0, 44.0, 43.0, 44.0, 44.0, 33.0, 36.0, 26.0, 33.0, 26.0, 24.0, 18.0, 9.0, 18.0, 18.0, 16.0, 10.0, 11.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48858642578125, -4.3404541015625, -4.19232177734375, -4.044189453125, -3.89605712890625, -3.7479248046875, -3.59979248046875, -3.45166015625, -3.30352783203125, -3.1553955078125, -3.00726318359375, -2.859130859375, -2.71099853515625, -2.5628662109375, -2.41473388671875, -2.2666015625, -2.11846923828125, -1.9703369140625, -1.82220458984375, -1.674072265625, -1.52593994140625, -1.3778076171875, -1.22967529296875, -1.08154296875, -0.93341064453125, -0.7852783203125, -0.63714599609375, -0.489013671875, -0.34088134765625, -0.1927490234375, -0.04461669921875, 0.103515625, 0.25164794921875, 0.3997802734375, 0.54791259765625, 0.696044921875, 0.84417724609375, 0.9923095703125, 1.14044189453125, 1.28857421875, 1.43670654296875, 1.5848388671875, 1.73297119140625, 1.881103515625, 2.02923583984375, 2.1773681640625, 2.32550048828125, 2.4736328125, 2.62176513671875, 2.7698974609375, 2.91802978515625, 3.066162109375, 3.21429443359375, 3.3624267578125, 3.51055908203125, 3.65869140625, 3.80682373046875, 3.9549560546875, 4.10308837890625, 4.251220703125, 4.39935302734375, 4.5474853515625, 4.69561767578125, 4.84375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 11.0, 6.0, 10.0, 17.0, 25.0, 28.0, 36.0, 45.0, 82.0, 131.0, 204.0, 382.0, 822.0, 1605.0, 3658.0, 9587.0, 28481.0, 109746.0, 721311.0, 2282006.0, 857762.0, 129653.0, 31958.0, 9862.0, 3672.0, 1545.0, 717.0, 363.0, 170.0, 111.0, 68.0, 41.0, 34.0, 21.0, 21.0, 19.0, 15.0, 12.0, 10.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3104248046875, -8.019287109375, -7.7281494140625, -7.43701171875, -7.1458740234375, -6.854736328125, -6.5635986328125, -6.2724609375, -5.9813232421875, -5.690185546875, -5.3990478515625, -5.10791015625, -4.8167724609375, -4.525634765625, -4.2344970703125, -3.943359375, -3.6522216796875, -3.361083984375, -3.0699462890625, -2.77880859375, -2.4876708984375, -2.196533203125, -1.9053955078125, -1.6142578125, -1.3231201171875, -1.031982421875, -0.7408447265625, -0.44970703125, -0.1585693359375, 0.132568359375, 0.4237060546875, 0.71484375, 1.0059814453125, 1.297119140625, 1.5882568359375, 1.87939453125, 2.1705322265625, 2.461669921875, 2.7528076171875, 3.0439453125, 3.3350830078125, 3.626220703125, 3.9173583984375, 4.20849609375, 4.4996337890625, 4.790771484375, 5.0819091796875, 5.373046875, 5.6641845703125, 5.955322265625, 6.2464599609375, 6.53759765625, 6.8287353515625, 7.119873046875, 7.4110107421875, 7.7021484375, 7.9932861328125, 8.284423828125, 8.5755615234375, 8.86669921875, 9.1578369140625, 9.448974609375, 9.7401123046875, 10.03125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 9.0, 21.0, 22.0, 41.0, 60.0, 55.0, 107.0, 141.0, 205.0, 328.0, 422.0, 543.0, 616.0, 461.0, 325.0, 235.0, 164.0, 102.0, 71.0, 48.0, 29.0, 21.0, 13.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.607666015625, -16.10595703125, -15.604248046875, -15.1025390625, -14.600830078125, -14.09912109375, -13.597412109375, -13.095703125, -12.593994140625, -12.09228515625, -11.590576171875, -11.0888671875, -10.587158203125, -10.08544921875, -9.583740234375, -9.08203125, -8.580322265625, -8.07861328125, -7.576904296875, -7.0751953125, -6.573486328125, -6.07177734375, -5.570068359375, -5.068359375, -4.566650390625, -4.06494140625, -3.563232421875, -3.0615234375, -2.559814453125, -2.05810546875, -1.556396484375, -1.0546875, -0.552978515625, -0.05126953125, 0.450439453125, 0.9521484375, 1.453857421875, 1.95556640625, 2.457275390625, 2.958984375, 3.460693359375, 3.96240234375, 4.464111328125, 4.9658203125, 5.467529296875, 5.96923828125, 6.470947265625, 6.97265625, 7.474365234375, 7.97607421875, 8.477783203125, 8.9794921875, 9.481201171875, 9.98291015625, 10.484619140625, 10.986328125, 11.488037109375, 11.98974609375, 12.491455078125, 12.9931640625, 13.494873046875, 13.99658203125, 14.498291015625, 15.0]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 2.0, 1.0, 7.0, 11.0, 15.0, 9.0, 18.0, 20.0, 25.0, 37.0, 43.0, 82.0, 88.0, 101.0, 194.0, 339.0, 556.0, 1379.0, 5073.0, 35135.0, 580777.0, 3369238.0, 179804.0, 16087.0, 2990.0, 920.0, 431.0, 251.0, 180.0, 113.0, 88.0, 53.0, 48.0, 28.0, 34.0, 22.0, 12.0, 11.0, 11.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-29.046875, -28.119384765625, -27.19189453125, -26.264404296875, -25.3369140625, -24.409423828125, -23.48193359375, -22.554443359375, -21.626953125, -20.699462890625, -19.77197265625, -18.844482421875, -17.9169921875, -16.989501953125, -16.06201171875, -15.134521484375, -14.20703125, -13.279541015625, -12.35205078125, -11.424560546875, -10.4970703125, -9.569580078125, -8.64208984375, -7.714599609375, -6.787109375, -5.859619140625, -4.93212890625, -4.004638671875, -3.0771484375, -2.149658203125, -1.22216796875, -0.294677734375, 0.6328125, 1.560302734375, 2.48779296875, 3.415283203125, 4.3427734375, 5.270263671875, 6.19775390625, 7.125244140625, 8.052734375, 8.980224609375, 9.90771484375, 10.835205078125, 11.7626953125, 12.690185546875, 13.61767578125, 14.545166015625, 15.47265625, 16.400146484375, 17.32763671875, 18.255126953125, 19.1826171875, 20.110107421875, 21.03759765625, 21.965087890625, 22.892578125, 23.820068359375, 24.74755859375, 25.675048828125, 26.6025390625, 27.530029296875, 28.45751953125, 29.385009765625, 30.3125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 24.0, 32.0, 69.0, 100.0, 124.0, 140.0, 155.0, 119.0, 108.0, 62.0, 26.0, 14.0, 12.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.81227111816406, -74.55052185058594, -72.28877258300781, -70.02702331542969, -67.76527404785156, -65.50352478027344, -63.24177932739258, -60.98003005981445, -58.71828079223633, -56.4565315246582, -54.19478225708008, -51.93303298950195, -49.671287536621094, -47.40953826904297, -45.147789001464844, -42.88603973388672, -40.624290466308594, -38.36254119873047, -36.100791931152344, -33.83904266357422, -31.577295303344727, -29.3155460357666, -27.05379867553711, -24.792049407958984, -22.53030014038086, -20.268550872802734, -18.00680160522461, -15.745054244995117, -13.483304977416992, -11.221555709838867, -8.959807395935059, -6.69805908203125, -4.436309814453125, -2.174561023712158, 0.0871877670288086, 2.3489365577697754, 4.610685348510742, 6.872434616088867, 9.134182929992676, 11.395931243896484, 13.65768051147461, 15.919429779052734, 18.18117904663086, 20.44292640686035, 22.704675674438477, 24.9664249420166, 27.228172302246094, 29.48992156982422, 31.751670837402344, 34.01342010498047, 36.275169372558594, 38.53691864013672, 40.798667907714844, 43.06041717529297, 45.32216262817383, 47.58391189575195, 49.84566116333008, 52.1074104309082, 54.36915969848633, 56.63090896606445, 58.89265441894531, 61.15440368652344, 63.41615295410156, 65.67790222167969, 67.93965148925781]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 8.0, 16.0, 13.0, 26.0, 20.0, 22.0, 30.0, 35.0, 34.0, 33.0, 37.0, 39.0, 37.0, 38.0, 51.0, 39.0, 46.0, 42.0, 57.0, 53.0, 44.0, 28.0, 42.0, 32.0, 32.0, 19.0, 20.0, 13.0, 19.0, 15.0, 7.0, 5.0, 7.0, 4.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.31919860839844, -41.86086654663086, -40.402530670166016, -38.94419860839844, -37.485862731933594, -36.027530670166016, -34.56919860839844, -33.110862731933594, -31.652528762817383, -30.194194793701172, -28.73586082458496, -27.27752685546875, -25.819194793701172, -24.360858917236328, -22.90252685546875, -21.44419288635254, -19.985858917236328, -18.527524948120117, -17.069190979003906, -15.610857963562012, -14.1525239944458, -12.69419002532959, -11.235857009887695, -9.777523040771484, -8.319189071655273, -6.8608551025390625, -5.40252161026001, -3.944188117980957, -2.485854148864746, -1.0275201797485352, 0.4308128356933594, 1.8891468048095703, 3.3474807739257812, 4.805814743041992, 6.264148235321045, 7.722481727600098, 9.180815696716309, 10.63914966583252, 12.097482681274414, 13.555816650390625, 15.014150619506836, 16.472484588623047, 17.930818557739258, 19.38915252685547, 20.847484588623047, 22.30582046508789, 23.76415252685547, 25.22248649597168, 26.68082046508789, 28.1391544342041, 29.597488403320312, 31.05582046508789, 32.514156341552734, 33.97248840332031, 35.430824279785156, 36.889156341552734, 38.34748840332031, 39.80582046508789, 41.264156341552734, 42.72248840332031, 44.180824279785156, 45.639156341552734, 47.09748840332031, 48.555824279785156, 50.01416015625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 3.0, 16.0, 18.0, 8.0, 31.0, 34.0, 51.0, 74.0, 88.0, 124.0, 180.0, 267.0, 400.0, 568.0, 803.0, 1150.0, 1713.0, 2478.0, 3857.0, 5902.0, 9038.0, 13980.0, 22122.0, 34545.0, 55387.0, 87665.0, 132525.0, 173248.0, 165699.0, 120940.0, 78440.0, 49300.0, 31134.0, 19910.0, 12512.0, 8047.0, 5270.0, 3525.0, 2342.0, 1578.0, 1068.0, 762.0, 512.0, 346.0, 260.0, 187.0, 137.0, 89.0, 56.0, 47.0, 38.0, 28.0, 21.0, 9.0, 11.0, 5.0, 7.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44341278076171875, -0.4285736083984375, -0.41373443603515625, -0.398895263671875, -0.38405609130859375, -0.3692169189453125, -0.35437774658203125, -0.33953857421875, -0.32469940185546875, -0.3098602294921875, -0.29502105712890625, -0.280181884765625, -0.26534271240234375, -0.2505035400390625, -0.23566436767578125, -0.2208251953125, -0.20598602294921875, -0.1911468505859375, -0.17630767822265625, -0.161468505859375, -0.14662933349609375, -0.1317901611328125, -0.11695098876953125, -0.10211181640625, -0.08727264404296875, -0.0724334716796875, -0.05759429931640625, -0.042755126953125, -0.02791595458984375, -0.0130767822265625, 0.00176239013671875, 0.0166015625, 0.03144073486328125, 0.0462799072265625, 0.06111907958984375, 0.075958251953125, 0.09079742431640625, 0.1056365966796875, 0.12047576904296875, 0.13531494140625, 0.15015411376953125, 0.1649932861328125, 0.17983245849609375, 0.194671630859375, 0.20951080322265625, 0.2243499755859375, 0.23918914794921875, 0.2540283203125, 0.26886749267578125, 0.2837066650390625, 0.29854583740234375, 0.313385009765625, 0.32822418212890625, 0.3430633544921875, 0.35790252685546875, 0.37274169921875, 0.38758087158203125, 0.4024200439453125, 0.41725921630859375, 0.432098388671875, 0.44693756103515625, 0.4617767333984375, 0.47661590576171875, 0.491455078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 10.0, 5.0, 6.0, 7.0, 12.0, 15.0, 20.0, 24.0, 31.0, 26.0, 32.0, 37.0, 42.0, 45.0, 39.0, 56.0, 48.0, 1065.0, 51.0, 63.0, 57.0, 55.0, 41.0, 39.0, 30.0, 25.0, 36.0, 29.0, 29.0, 18.0, 13.0, 15.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.923858642578125, -3.80084228515625, -3.677825927734375, -3.5548095703125, -3.431793212890625, -3.30877685546875, -3.185760498046875, -3.062744140625, -2.939727783203125, -2.81671142578125, -2.693695068359375, -2.5706787109375, -2.447662353515625, -2.32464599609375, -2.201629638671875, -2.07861328125, -1.955596923828125, -1.83258056640625, -1.709564208984375, -1.5865478515625, -1.463531494140625, -1.34051513671875, -1.217498779296875, -1.094482421875, -0.971466064453125, -0.84844970703125, -0.725433349609375, -0.6024169921875, -0.479400634765625, -0.35638427734375, -0.233367919921875, -0.1103515625, 0.012664794921875, 0.13568115234375, 0.258697509765625, 0.3817138671875, 0.504730224609375, 0.62774658203125, 0.750762939453125, 0.873779296875, 0.996795654296875, 1.11981201171875, 1.242828369140625, 1.3658447265625, 1.488861083984375, 1.61187744140625, 1.734893798828125, 1.85791015625, 1.980926513671875, 2.10394287109375, 2.226959228515625, 2.3499755859375, 2.472991943359375, 2.59600830078125, 2.719024658203125, 2.842041015625, 2.965057373046875, 3.08807373046875, 3.211090087890625, 3.3341064453125, 3.457122802734375, 3.58013916015625, 3.703155517578125, 3.826171875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 9.0, 15.0, 17.0, 25.0, 32.0, 47.0, 114.0, 174.0, 258.0, 438.0, 731.0, 1217.0, 2052.0, 3395.0, 5520.0, 9215.0, 15369.0, 25379.0, 42081.0, 68286.0, 107979.0, 155898.0, 1228516.0, 153608.0, 105608.0, 66709.0, 41099.0, 24865.0, 15166.0, 9175.0, 5618.0, 3322.0, 2081.0, 1217.0, 730.0, 478.0, 242.0, 199.0, 102.0, 55.0, 30.0, 18.0, 15.0, 12.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.368408203125, -0.3563232421875, -0.34423828125, -0.3321533203125, -0.320068359375, -0.3079833984375, -0.2958984375, -0.2838134765625, -0.271728515625, -0.2596435546875, -0.24755859375, -0.2354736328125, -0.223388671875, -0.2113037109375, -0.19921875, -0.1871337890625, -0.175048828125, -0.1629638671875, -0.15087890625, -0.1387939453125, -0.126708984375, -0.1146240234375, -0.1025390625, -0.0904541015625, -0.078369140625, -0.0662841796875, -0.05419921875, -0.0421142578125, -0.030029296875, -0.0179443359375, -0.005859375, 0.0062255859375, 0.018310546875, 0.0303955078125, 0.04248046875, 0.0545654296875, 0.066650390625, 0.0787353515625, 0.0908203125, 0.1029052734375, 0.114990234375, 0.1270751953125, 0.13916015625, 0.1512451171875, 0.163330078125, 0.1754150390625, 0.1875, 0.1995849609375, 0.211669921875, 0.2237548828125, 0.23583984375, 0.2479248046875, 0.260009765625, 0.2720947265625, 0.2841796875, 0.2962646484375, 0.308349609375, 0.3204345703125, 0.33251953125, 0.3446044921875, 0.356689453125, 0.3687744140625, 0.380859375, 0.3929443359375, 0.405029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 5.0, 5.0, 9.0, 11.0, 11.0, 14.0, 18.0, 21.0, 21.0, 24.0, 34.0, 53.0, 57.0, 59.0, 69.0, 67.0, 56.0, 73.0, 51.0, 50.0, 63.0, 41.0, 32.0, 22.0, 31.0, 20.0, 19.0, 7.0, 6.0, 9.0, 8.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0033111572265625, -0.003223031759262085, -0.00313490629196167, -0.003046780824661255, -0.00295865535736084, -0.002870529890060425, -0.0027824044227600098, -0.0026942789554595947, -0.0026061534881591797, -0.0025180280208587646, -0.0024299025535583496, -0.0023417770862579346, -0.0022536516189575195, -0.0021655261516571045, -0.0020774006843566895, -0.0019892752170562744, -0.0019011497497558594, -0.0018130242824554443, -0.0017248988151550293, -0.0016367733478546143, -0.0015486478805541992, -0.0014605224132537842, -0.0013723969459533691, -0.001284271478652954, -0.001196146011352539, -0.001108020544052124, -0.001019895076751709, -0.0009317696094512939, -0.0008436441421508789, -0.0007555186748504639, -0.0006673932075500488, -0.0005792677402496338, -0.0004911422729492188, -0.0004030168056488037, -0.00031489133834838867, -0.00022676587104797363, -0.0001386404037475586, -5.0514936447143555e-05, 3.7610530853271484e-05, 0.00012573599815368652, 0.00021386146545410156, 0.0003019869327545166, 0.00039011240005493164, 0.0004782378673553467, 0.0005663633346557617, 0.0006544888019561768, 0.0007426142692565918, 0.0008307397365570068, 0.0009188652038574219, 0.001006990671157837, 0.001095116138458252, 0.001183241605758667, 0.001271367073059082, 0.001359492540359497, 0.0014476180076599121, 0.0015357434749603271, 0.0016238689422607422, 0.0017119944095611572, 0.0018001198768615723, 0.0018882453441619873, 0.0019763708114624023, 0.0020644962787628174, 0.0021526217460632324, 0.0022407472133636475, 0.0023288726806640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 5.0, 13.0, 10.0, 11.0, 11.0, 19.0, 25.0, 42.0, 55.0, 78.0, 99.0, 123.0, 202.0, 283.0, 535.0, 3627.0, 953122.0, 87945.0, 1095.0, 403.0, 239.0, 148.0, 121.0, 100.0, 57.0, 49.0, 44.0, 22.0, 19.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047515869140625, -0.04574155807495117, -0.043967247009277344, -0.042192935943603516, -0.04041862487792969, -0.03864431381225586, -0.03687000274658203, -0.0350956916809082, -0.033321380615234375, -0.03154706954956055, -0.02977275848388672, -0.02799844741821289, -0.026224136352539062, -0.024449825286865234, -0.022675514221191406, -0.020901203155517578, -0.01912689208984375, -0.017352581024169922, -0.015578269958496094, -0.013803958892822266, -0.012029647827148438, -0.01025533676147461, -0.008481025695800781, -0.006706714630126953, -0.004932403564453125, -0.003158092498779297, -0.0013837814331054688, 0.0003905296325683594, 0.0021648406982421875, 0.003939151763916016, 0.005713462829589844, 0.007487773895263672, 0.0092620849609375, 0.011036396026611328, 0.012810707092285156, 0.014585018157958984, 0.016359329223632812, 0.01813364028930664, 0.01990795135498047, 0.021682262420654297, 0.023456573486328125, 0.025230884552001953, 0.02700519561767578, 0.02877950668334961, 0.030553817749023438, 0.032328128814697266, 0.034102439880371094, 0.03587675094604492, 0.03765106201171875, 0.03942537307739258, 0.041199684143066406, 0.042973995208740234, 0.04474830627441406, 0.04652261734008789, 0.04829692840576172, 0.05007123947143555, 0.051845550537109375, 0.0536198616027832, 0.05539417266845703, 0.05716848373413086, 0.05894279479980469, 0.060717105865478516, 0.062491416931152344, 0.06426572799682617, 0.0660400390625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 10.0, 443.0, 531.0, 31.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016857799142599106, -0.016347317025065422, -0.015836836770176888, -0.015326354652643204, -0.014815873466432095, -0.014305392280220985, -0.013794910162687302, -0.013284428976476192, -0.012773947790265083, -0.012263466604053974, -0.011752985417842865, -0.011242503300309181, -0.010732022114098072, -0.010221540927886963, -0.009711058810353279, -0.00920057762414217, -0.00869009643793106, -0.008179615251719952, -0.007669133599847555, -0.007158651947975159, -0.0066481707617640495, -0.00613768957555294, -0.005627207923680544, -0.005116726271808147, -0.004606245085597038, -0.004095763899385929, -0.0035852822475135326, -0.00307480082847178, -0.002564319409430027, -0.002053837990388274, -0.0015433565713465214, -0.0010328751523047686, -0.000522395595908165, -1.1914176866412163e-05, 0.0004985672421753407, 0.0010090486612170935, 0.0015195300802588463, 0.002030011499300599, 0.002540492918342352, 0.0030509743373841047, 0.0035614557564258575, 0.004071936942636967, 0.004582418594509363, 0.00509290024638176, 0.005603381432592869, 0.006113862618803978, 0.0066243442706763744, 0.007134825922548771, 0.00764530710875988, 0.00815578829497099, 0.008666269481182098, 0.009176751598715782, 0.009687232784926891, 0.010197713971138, 0.010708196088671684, 0.011218677274882793, 0.011729158461093903, 0.012239639647305012, 0.012750120833516121, 0.013260602951049805, 0.013771084137260914, 0.014281565323472023, 0.014792047441005707, 0.015302528627216816, 0.015813009813427925]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 5.0, 8.0, 9.0, 10.0, 22.0, 25.0, 13.0, 20.0, 24.0, 26.0, 32.0, 23.0, 37.0, 31.0, 33.0, 31.0, 24.0, 36.0, 45.0, 52.0, 47.0, 45.0, 34.0, 36.0, 28.0, 42.0, 23.0, 31.0, 24.0, 20.0, 29.0, 12.0, 17.0, 14.0, 10.0, 17.0, 13.0, 13.0, 5.0, 3.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013415217399597168, -0.0012950357049703598, -0.0012485496699810028, -0.0012020636349916458, -0.0011555776000022888, -0.0011090915650129318, -0.0010626055300235748, -0.0010161194950342178, -0.0009696334600448608, -0.0009231474250555038, -0.0008766613900661469, -0.0008301753550767899, -0.0007836893200874329, -0.0007372032850980759, -0.0006907172501087189, -0.0006442312151193619, -0.0005977451801300049, -0.0005512591451406479, -0.0005047731101512909, -0.0004582870751619339, -0.0004118010401725769, -0.0003653150051832199, -0.0003188289701938629, -0.0002723429352045059, -0.00022585690021514893, -0.00017937086522579193, -0.00013288483023643494, -8.639879524707794e-05, -3.991276025772095e-05, 6.573274731636047e-06, 5.305930972099304e-05, 9.954534471035004e-05, 0.00014603137969970703, 0.00019251741468906403, 0.00023900344967842102, 0.000285489484667778, 0.000331975519657135, 0.000378461554646492, 0.000424947589635849, 0.000471433624625206, 0.000517919659614563, 0.00056440569460392, 0.000610891729593277, 0.000657377764582634, 0.000703863799571991, 0.000750349834561348, 0.000796835869550705, 0.000843321904540062, 0.0008898079395294189, 0.0009362939745187759, 0.000982780009508133, 0.00102926604449749, 0.001075752079486847, 0.001122238114476204, 0.001168724149465561, 0.001215210184454918, 0.001261696219444275, 0.001308182254433632, 0.001354668289422989, 0.0014011543244123459, 0.0014476403594017029, 0.0014941263943910599, 0.0015406124293804169, 0.0015870984643697739, 0.0016335844993591309]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 6.0, 19.0, 19.0, 13.0, 18.0, 32.0, 21.0, 31.0, 33.0, 24.0, 36.0, 40.0, 48.0, 49.0, 47.0, 48.0, 38.0, 39.0, 41.0, 35.0, 46.0, 33.0, 37.0, 31.0, 32.0, 33.0, 24.0, 18.0, 21.0, 10.0, 13.0, 3.0, 13.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.50390625, -5.34686279296875, -5.1898193359375, -5.03277587890625, -4.875732421875, -4.71868896484375, -4.5616455078125, -4.40460205078125, -4.24755859375, -4.09051513671875, -3.9334716796875, -3.77642822265625, -3.619384765625, -3.46234130859375, -3.3052978515625, -3.14825439453125, -2.9912109375, -2.83416748046875, -2.6771240234375, -2.52008056640625, -2.363037109375, -2.20599365234375, -2.0489501953125, -1.89190673828125, -1.73486328125, -1.57781982421875, -1.4207763671875, -1.26373291015625, -1.106689453125, -0.94964599609375, -0.7926025390625, -0.63555908203125, -0.478515625, -0.32147216796875, -0.1644287109375, -0.00738525390625, 0.149658203125, 0.30670166015625, 0.4637451171875, 0.62078857421875, 0.77783203125, 0.93487548828125, 1.0919189453125, 1.24896240234375, 1.406005859375, 1.56304931640625, 1.7200927734375, 1.87713623046875, 2.0341796875, 2.19122314453125, 2.3482666015625, 2.50531005859375, 2.662353515625, 2.81939697265625, 2.9764404296875, 3.13348388671875, 3.29052734375, 3.44757080078125, 3.6046142578125, 3.76165771484375, 3.918701171875, 4.07574462890625, 4.2327880859375, 4.38983154296875, 4.546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 16.0, 12.0, 17.0, 33.0, 47.0, 64.0, 100.0, 127.0, 189.0, 265.0, 413.0, 626.0, 964.0, 1428.0, 2303.0, 4158.0, 8233.0, 19779.0, 63299.0, 265849.0, 489946.0, 129315.0, 34752.0, 12404.0, 5773.0, 3169.0, 1792.0, 1121.0, 749.0, 535.0, 315.0, 231.0, 159.0, 110.0, 75.0, 46.0, 42.0, 25.0, 15.0, 17.0, 6.0, 4.0, 4.0, 8.0, 11.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0390625, -3.913848876953125, -3.78863525390625, -3.663421630859375, -3.5382080078125, -3.412994384765625, -3.28778076171875, -3.162567138671875, -3.037353515625, -2.912139892578125, -2.78692626953125, -2.661712646484375, -2.5364990234375, -2.411285400390625, -2.28607177734375, -2.160858154296875, -2.03564453125, -1.910430908203125, -1.78521728515625, -1.660003662109375, -1.5347900390625, -1.409576416015625, -1.28436279296875, -1.159149169921875, -1.033935546875, -0.908721923828125, -0.78350830078125, -0.658294677734375, -0.5330810546875, -0.407867431640625, -0.28265380859375, -0.157440185546875, -0.0322265625, 0.092987060546875, 0.21820068359375, 0.343414306640625, 0.4686279296875, 0.593841552734375, 0.71905517578125, 0.844268798828125, 0.969482421875, 1.094696044921875, 1.21990966796875, 1.345123291015625, 1.4703369140625, 1.595550537109375, 1.72076416015625, 1.845977783203125, 1.97119140625, 2.096405029296875, 2.22161865234375, 2.346832275390625, 2.4720458984375, 2.597259521484375, 2.72247314453125, 2.847686767578125, 2.972900390625, 3.098114013671875, 3.22332763671875, 3.348541259765625, 3.4737548828125, 3.598968505859375, 3.72418212890625, 3.849395751953125, 3.974609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 1.0, 4.0, 8.0, 12.0, 9.0, 9.0, 15.0, 16.0, 26.0, 24.0, 26.0, 34.0, 31.0, 51.0, 54.0, 49.0, 62.0, 113.0, 1731.0, 276.0, 77.0, 55.0, 49.0, 48.0, 39.0, 37.0, 37.0, 21.0, 29.0, 27.0, 17.0, 11.0, 12.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.25244140625, -15.6455078125, -15.03857421875, -14.431640625, -13.82470703125, -13.2177734375, -12.61083984375, -12.00390625, -11.39697265625, -10.7900390625, -10.18310546875, -9.576171875, -8.96923828125, -8.3623046875, -7.75537109375, -7.1484375, -6.54150390625, -5.9345703125, -5.32763671875, -4.720703125, -4.11376953125, -3.5068359375, -2.89990234375, -2.29296875, -1.68603515625, -1.0791015625, -0.47216796875, 0.134765625, 0.74169921875, 1.3486328125, 1.95556640625, 2.5625, 3.16943359375, 3.7763671875, 4.38330078125, 4.990234375, 5.59716796875, 6.2041015625, 6.81103515625, 7.41796875, 8.02490234375, 8.6318359375, 9.23876953125, 9.845703125, 10.45263671875, 11.0595703125, 11.66650390625, 12.2734375, 12.88037109375, 13.4873046875, 14.09423828125, 14.701171875, 15.30810546875, 15.9150390625, 16.52197265625, 17.12890625, 17.73583984375, 18.3427734375, 18.94970703125, 19.556640625, 20.16357421875, 20.7705078125, 21.37744140625, 21.984375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 13.0, 4.0, 3.0, 14.0, 12.0, 11.0, 19.0, 24.0, 31.0, 42.0, 49.0, 69.0, 76.0, 126.0, 218.0, 460.0, 1378.0, 18918.0, 3061004.0, 59624.0, 2330.0, 491.0, 243.0, 153.0, 97.0, 72.0, 51.0, 42.0, 26.0, 23.0, 16.0, 19.0, 7.0, 11.0, 12.0, 5.0, 1.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.875, -34.895751953125, -33.91650390625, -32.937255859375, -31.9580078125, -30.978759765625, -29.99951171875, -29.020263671875, -28.041015625, -27.061767578125, -26.08251953125, -25.103271484375, -24.1240234375, -23.144775390625, -22.16552734375, -21.186279296875, -20.20703125, -19.227783203125, -18.24853515625, -17.269287109375, -16.2900390625, -15.310791015625, -14.33154296875, -13.352294921875, -12.373046875, -11.393798828125, -10.41455078125, -9.435302734375, -8.4560546875, -7.476806640625, -6.49755859375, -5.518310546875, -4.5390625, -3.559814453125, -2.58056640625, -1.601318359375, -0.6220703125, 0.357177734375, 1.33642578125, 2.315673828125, 3.294921875, 4.274169921875, 5.25341796875, 6.232666015625, 7.2119140625, 8.191162109375, 9.17041015625, 10.149658203125, 11.12890625, 12.108154296875, 13.08740234375, 14.066650390625, 15.0458984375, 16.025146484375, 17.00439453125, 17.983642578125, 18.962890625, 19.942138671875, 20.92138671875, 21.900634765625, 22.8798828125, 23.859130859375, 24.83837890625, 25.817626953125, 26.796875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 42.0, 330.0, 538.0, 97.0, 10.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.038566589355469, -11.344952583312988, -8.651338577270508, -5.957724571228027, -3.264110565185547, -0.5704965591430664, 2.123117446899414, 4.816730499267578, 7.510345458984375, 10.203959465026855, 12.897573471069336, 15.591187477111816, 18.284801483154297, 20.978416442871094, 23.672029495239258, 26.365642547607422, 29.05925750732422, 31.752872467041016, 34.44648742675781, 37.140098571777344, 39.83371353149414, 42.52732849121094, 45.22093963623047, 47.914554595947266, 50.60816955566406, 53.30178451538086, 55.995399475097656, 58.68901062011719, 61.382625579833984, 64.07624053955078, 66.76985168457031, 69.46347045898438, 72.15708923339844, 74.85070037841797, 77.54431915283203, 80.23793029785156, 82.93154907226562, 85.62516021728516, 88.31877136230469, 91.01239013671875, 93.70600128173828, 96.39961242675781, 99.09323120117188, 101.7868423461914, 104.48045349121094, 107.174072265625, 109.86768341064453, 112.56129455566406, 115.25491333007812, 117.94852447509766, 120.64214324951172, 123.33575439453125, 126.02937316894531, 128.7229766845703, 131.41659545898438, 134.11021423339844, 136.8038330078125, 139.49745178222656, 142.19105529785156, 144.88467407226562, 147.5782928466797, 150.2718963623047, 152.96551513671875, 155.6591339111328, 158.3527374267578]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 16.0, 14.0, 16.0, 20.0, 24.0, 14.0, 35.0, 29.0, 26.0, 39.0, 45.0, 28.0, 31.0, 36.0, 29.0, 36.0, 36.0, 33.0, 28.0, 53.0, 36.0, 38.0, 25.0, 29.0, 18.0, 17.0, 24.0, 19.0, 15.0, 16.0, 12.0, 15.0, 13.0, 7.0, 14.0, 4.0, 13.0, 4.0, 1.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-50.27008819580078, -48.72826385498047, -47.186439514160156, -45.64461898803711, -44.1027946472168, -42.560970306396484, -41.01914978027344, -39.477325439453125, -37.93550109863281, -36.3936767578125, -34.85185241699219, -33.31003189086914, -31.768207550048828, -30.226383209228516, -28.684560775756836, -27.142738342285156, -25.600914001464844, -24.05908966064453, -22.51726722717285, -20.975444793701172, -19.43362045288086, -17.891796112060547, -16.349973678588867, -14.808150291442871, -13.266326904296875, -11.724503517150879, -10.182680130004883, -8.640856742858887, -7.099033355712891, -5.5572099685668945, -4.015386581420898, -2.4735631942749023, -0.9317359924316406, 0.6100873947143555, 2.1519107818603516, 3.6937341690063477, 5.235557556152344, 6.77738094329834, 8.319204330444336, 9.861027717590332, 11.402851104736328, 12.944674491882324, 14.48649787902832, 16.0283203125, 17.570144653320312, 19.111968994140625, 20.653791427612305, 22.195613861083984, 23.737438201904297, 25.27926254272461, 26.82108497619629, 28.36290740966797, 29.90473175048828, 31.446556091308594, 32.988380432128906, 34.53020095825195, 36.072025299072266, 37.61384963989258, 39.155670166015625, 40.69749450683594, 42.23931884765625, 43.78114318847656, 45.322967529296875, 46.86478805541992, 48.406612396240234]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 8.0, 7.0, 7.0, 22.0, 15.0, 13.0, 25.0, 25.0, 26.0, 25.0, 32.0, 32.0, 32.0, 37.0, 51.0, 51.0, 34.0, 45.0, 47.0, 38.0, 35.0, 39.0, 42.0, 36.0, 33.0, 32.0, 29.0, 37.0, 26.0, 15.0, 17.0, 18.0, 10.0, 11.0, 6.0, 8.0, 8.0, 10.0, 0.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.350830078125, -5.19384765625, -5.036865234375, -4.8798828125, -4.722900390625, -4.56591796875, -4.408935546875, -4.251953125, -4.094970703125, -3.93798828125, -3.781005859375, -3.6240234375, -3.467041015625, -3.31005859375, -3.153076171875, -2.99609375, -2.839111328125, -2.68212890625, -2.525146484375, -2.3681640625, -2.211181640625, -2.05419921875, -1.897216796875, -1.740234375, -1.583251953125, -1.42626953125, -1.269287109375, -1.1123046875, -0.955322265625, -0.79833984375, -0.641357421875, -0.484375, -0.327392578125, -0.17041015625, -0.013427734375, 0.1435546875, 0.300537109375, 0.45751953125, 0.614501953125, 0.771484375, 0.928466796875, 1.08544921875, 1.242431640625, 1.3994140625, 1.556396484375, 1.71337890625, 1.870361328125, 2.02734375, 2.184326171875, 2.34130859375, 2.498291015625, 2.6552734375, 2.812255859375, 2.96923828125, 3.126220703125, 3.283203125, 3.440185546875, 3.59716796875, 3.754150390625, 3.9111328125, 4.068115234375, 4.22509765625, 4.382080078125, 4.5390625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 8.0, 5.0, 15.0, 17.0, 21.0, 15.0, 17.0, 31.0, 33.0, 42.0, 104.0, 161.0, 360.0, 851.0, 3031.0, 14341.0, 103183.0, 1710362.0, 2196482.0, 142218.0, 17737.0, 3441.0, 952.0, 354.0, 167.0, 91.0, 49.0, 42.0, 21.0, 23.0, 17.0, 18.0, 14.0, 10.0, 7.0, 7.0, 8.0, 7.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.3125, -15.8336181640625, -15.354736328125, -14.8758544921875, -14.39697265625, -13.9180908203125, -13.439208984375, -12.9603271484375, -12.4814453125, -12.0025634765625, -11.523681640625, -11.0447998046875, -10.56591796875, -10.0870361328125, -9.608154296875, -9.1292724609375, -8.650390625, -8.1715087890625, -7.692626953125, -7.2137451171875, -6.73486328125, -6.2559814453125, -5.777099609375, -5.2982177734375, -4.8193359375, -4.3404541015625, -3.861572265625, -3.3826904296875, -2.90380859375, -2.4249267578125, -1.946044921875, -1.4671630859375, -0.98828125, -0.5093994140625, -0.030517578125, 0.4483642578125, 0.92724609375, 1.4061279296875, 1.885009765625, 2.3638916015625, 2.8427734375, 3.3216552734375, 3.800537109375, 4.2794189453125, 4.75830078125, 5.2371826171875, 5.716064453125, 6.1949462890625, 6.673828125, 7.1527099609375, 7.631591796875, 8.1104736328125, 8.58935546875, 9.0682373046875, 9.547119140625, 10.0260009765625, 10.5048828125, 10.9837646484375, 11.462646484375, 11.9415283203125, 12.42041015625, 12.8992919921875, 13.378173828125, 13.8570556640625, 14.3359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 11.0, 16.0, 20.0, 28.0, 53.0, 79.0, 88.0, 156.0, 193.0, 326.0, 461.0, 586.0, 553.0, 468.0, 319.0, 262.0, 139.0, 101.0, 72.0, 47.0, 29.0, 19.0, 15.0, 14.0, 4.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-20.328125, -19.8197021484375, -19.311279296875, -18.8028564453125, -18.29443359375, -17.7860107421875, -17.277587890625, -16.7691650390625, -16.2607421875, -15.7523193359375, -15.243896484375, -14.7354736328125, -14.22705078125, -13.7186279296875, -13.210205078125, -12.7017822265625, -12.193359375, -11.6849365234375, -11.176513671875, -10.6680908203125, -10.15966796875, -9.6512451171875, -9.142822265625, -8.6343994140625, -8.1259765625, -7.6175537109375, -7.109130859375, -6.6007080078125, -6.09228515625, -5.5838623046875, -5.075439453125, -4.5670166015625, -4.05859375, -3.5501708984375, -3.041748046875, -2.5333251953125, -2.02490234375, -1.5164794921875, -1.008056640625, -0.4996337890625, 0.0087890625, 0.5172119140625, 1.025634765625, 1.5340576171875, 2.04248046875, 2.5509033203125, 3.059326171875, 3.5677490234375, 4.076171875, 4.5845947265625, 5.093017578125, 5.6014404296875, 6.10986328125, 6.6182861328125, 7.126708984375, 7.6351318359375, 8.1435546875, 8.6519775390625, 9.160400390625, 9.6688232421875, 10.17724609375, 10.6856689453125, 11.194091796875, 11.7025146484375, 12.2109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 17.0, 19.0, 25.0, 29.0, 43.0, 62.0, 97.0, 126.0, 197.0, 388.0, 877.0, 3427.0, 33745.0, 1341233.0, 2747850.0, 59150.0, 4779.0, 1047.0, 451.0, 211.0, 152.0, 79.0, 71.0, 52.0, 38.0, 23.0, 18.0, 16.0, 5.0, 8.0, 13.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.404296875, -28.27734375, -27.150390625, -26.0234375, -24.896484375, -23.76953125, -22.642578125, -21.515625, -20.388671875, -19.26171875, -18.134765625, -17.0078125, -15.880859375, -14.75390625, -13.626953125, -12.5, -11.373046875, -10.24609375, -9.119140625, -7.9921875, -6.865234375, -5.73828125, -4.611328125, -3.484375, -2.357421875, -1.23046875, -0.103515625, 1.0234375, 2.150390625, 3.27734375, 4.404296875, 5.53125, 6.658203125, 7.78515625, 8.912109375, 10.0390625, 11.166015625, 12.29296875, 13.419921875, 14.546875, 15.673828125, 16.80078125, 17.927734375, 19.0546875, 20.181640625, 21.30859375, 22.435546875, 23.5625, 24.689453125, 25.81640625, 26.943359375, 28.0703125, 29.197265625, 30.32421875, 31.451171875, 32.578125, 33.705078125, 34.83203125, 35.958984375, 37.0859375, 38.212890625, 39.33984375, 40.466796875, 41.59375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 30.0, 142.0, 363.0, 322.0, 132.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-290.1250305175781, -283.5070495605469, -276.8890686035156, -270.2710876464844, -263.6531066894531, -257.03515625, -250.4171600341797, -243.79917907714844, -237.18121337890625, -230.563232421875, -223.94525146484375, -217.3272705078125, -210.7093048095703, -204.09132385253906, -197.4733428955078, -190.85536193847656, -184.2373809814453, -177.61940002441406, -171.0014190673828, -164.38345336914062, -157.76547241210938, -151.14749145507812, -144.52951049804688, -137.91152954101562, -131.29354858398438, -124.67556762695312, -118.0575942993164, -111.43961334228516, -104.82164001464844, -98.20365905761719, -91.58567810058594, -84.96769714355469, -78.34971618652344, -71.73173522949219, -65.11376190185547, -58.49578094482422, -51.877803802490234, -45.25982666015625, -38.641845703125, -32.023868560791016, -25.40589141845703, -18.787914276123047, -12.16993522644043, -5.5519561767578125, 1.0660209655761719, 7.683998107910156, 14.301979064941406, 20.91995620727539, 27.537933349609375, 34.15591049194336, 40.773887634277344, 47.391868591308594, 54.00984573364258, 60.62782287597656, 67.24580383300781, 73.86378479003906, 80.48175811767578, 87.09973907470703, 93.71771240234375, 100.335693359375, 106.95367431640625, 113.57164764404297, 120.18962860107422, 126.80760192871094, 133.4255828857422]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 15.0, 8.0, 6.0, 13.0, 13.0, 22.0, 22.0, 26.0, 26.0, 23.0, 30.0, 32.0, 32.0, 38.0, 28.0, 34.0, 46.0, 47.0, 31.0, 46.0, 41.0, 43.0, 40.0, 30.0, 39.0, 37.0, 31.0, 33.0, 21.0, 20.0, 18.0, 16.0, 19.0, 15.0, 13.0, 6.0, 11.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.915924072265625, -41.523773193359375, -40.131622314453125, -38.739471435546875, -37.347320556640625, -35.95517349243164, -34.56302261352539, -33.17087173461914, -31.77872085571289, -30.38656997680664, -28.99441909790039, -27.602270126342773, -26.210119247436523, -24.817968368530273, -23.425819396972656, -22.033668518066406, -20.641517639160156, -19.249366760253906, -17.857215881347656, -16.46506690979004, -15.072916030883789, -13.680765151977539, -12.288615226745605, -10.896465301513672, -9.504314422607422, -8.112163543701172, -6.720013618469238, -5.3278632164001465, -3.9357128143310547, -2.543562412261963, -1.151412010192871, 0.2407379150390625, 1.6328887939453125, 3.0250391960144043, 4.417189598083496, 5.809340000152588, 7.20149040222168, 8.59364128112793, 9.985791206359863, 11.377941131591797, 12.770092010498047, 14.162242889404297, 15.55439281463623, 16.946542739868164, 18.338693618774414, 19.730844497680664, 21.12299346923828, 22.51514434814453, 23.90729522705078, 25.29944610595703, 26.69159698486328, 28.0837459564209, 29.47589683532715, 30.8680477142334, 32.260196685791016, 33.652347564697266, 35.044498443603516, 36.436649322509766, 37.828800201416016, 39.220951080322266, 40.61309814453125, 42.0052490234375, 43.39739990234375, 44.78955078125, 46.18170166015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 38.0, 29.0, 27.0, 24.0, 27.0, 22.0, 12.0, 16.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 14.0, 21.0, 31.0, 55.0, 77.0, 113.0, 190.0, 257.0, 354.0, 530.0, 762.0, 1239.0, 1750.0, 2666.0, 4017.0, 5923.0, 8961.0, 13594.0, 20748.0, 31690.0, 49608.0, 76277.0, 113127.0, 152441.0, 164121.0, 132015.0, 93086.0, 60885.0, 39174.0, 25624.0, 16589.0, 10822.0, 7201.0, 4867.0, 3185.0, 2163.0, 1411.0, 977.0, 668.0, 415.0, 291.0, 201.0, 126.0, 98.0, 64.0, 49.0, 30.0, 11.0, 12.0, 7.0, 13.0, 2.0, 4.0], "bins": [-0.51025390625, -0.4957733154296875, -0.481292724609375, -0.4668121337890625, -0.45233154296875, -0.4378509521484375, -0.423370361328125, -0.4088897705078125, -0.3944091796875, -0.3799285888671875, -0.365447998046875, -0.3509674072265625, -0.33648681640625, -0.3220062255859375, -0.307525634765625, -0.2930450439453125, -0.278564453125, -0.2640838623046875, -0.249603271484375, -0.2351226806640625, -0.22064208984375, -0.2061614990234375, -0.191680908203125, -0.1772003173828125, -0.1627197265625, -0.1482391357421875, -0.133758544921875, -0.1192779541015625, -0.10479736328125, -0.0903167724609375, -0.075836181640625, -0.0613555908203125, -0.046875, -0.0323944091796875, -0.017913818359375, -0.0034332275390625, 0.01104736328125, 0.0255279541015625, 0.040008544921875, 0.0544891357421875, 0.0689697265625, 0.0834503173828125, 0.097930908203125, 0.1124114990234375, 0.12689208984375, 0.1413726806640625, 0.155853271484375, 0.1703338623046875, 0.184814453125, 0.1992950439453125, 0.213775634765625, 0.2282562255859375, 0.24273681640625, 0.2572174072265625, 0.271697998046875, 0.2861785888671875, 0.3006591796875, 0.3151397705078125, 0.329620361328125, 0.3441009521484375, 0.35858154296875, 0.3730621337890625, 0.387542724609375, 0.4020233154296875, 0.41650390625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 3.0, 10.0, 8.0, 17.0, 7.0, 11.0, 17.0, 22.0, 17.0, 29.0, 30.0, 29.0, 30.0, 34.0, 42.0, 50.0, 33.0, 47.0, 40.0, 1065.0, 33.0, 37.0, 34.0, 43.0, 37.0, 31.0, 37.0, 31.0, 26.0, 28.0, 18.0, 31.0, 11.0, 13.0, 19.0, 9.0, 7.0, 7.0, 8.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-3.93359375, -3.8292236328125, -3.724853515625, -3.6204833984375, -3.51611328125, -3.4117431640625, -3.307373046875, -3.2030029296875, -3.0986328125, -2.9942626953125, -2.889892578125, -2.7855224609375, -2.68115234375, -2.5767822265625, -2.472412109375, -2.3680419921875, -2.263671875, -2.1593017578125, -2.054931640625, -1.9505615234375, -1.84619140625, -1.7418212890625, -1.637451171875, -1.5330810546875, -1.4287109375, -1.3243408203125, -1.219970703125, -1.1156005859375, -1.01123046875, -0.9068603515625, -0.802490234375, -0.6981201171875, -0.59375, -0.4893798828125, -0.385009765625, -0.2806396484375, -0.17626953125, -0.0718994140625, 0.032470703125, 0.1368408203125, 0.2412109375, 0.3455810546875, 0.449951171875, 0.5543212890625, 0.65869140625, 0.7630615234375, 0.867431640625, 0.9718017578125, 1.076171875, 1.1805419921875, 1.284912109375, 1.3892822265625, 1.49365234375, 1.5980224609375, 1.702392578125, 1.8067626953125, 1.9111328125, 2.0155029296875, 2.119873046875, 2.2242431640625, 2.32861328125, 2.4329833984375, 2.537353515625, 2.6417236328125, 2.74609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 12.0, 10.0, 31.0, 34.0, 83.0, 106.0, 166.0, 276.0, 434.0, 701.0, 1065.0, 1837.0, 2882.0, 4471.0, 7062.0, 10878.0, 16859.0, 25970.0, 40017.0, 61382.0, 92321.0, 130035.0, 1200742.0, 154481.0, 116473.0, 79995.0, 52644.0, 34136.0, 22217.0, 14269.0, 9221.0, 5895.0, 3897.0, 2435.0, 1528.0, 995.0, 567.0, 357.0, 233.0, 138.0, 103.0, 55.0, 43.0, 26.0, 17.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.3671875, -0.3559989929199219, -0.34481048583984375, -0.3336219787597656, -0.3224334716796875, -0.3112449645996094, -0.30005645751953125, -0.2888679504394531, -0.277679443359375, -0.2664909362792969, -0.25530242919921875, -0.24411392211914062, -0.2329254150390625, -0.22173690795898438, -0.21054840087890625, -0.19935989379882812, -0.18817138671875, -0.17698287963867188, -0.16579437255859375, -0.15460586547851562, -0.1434173583984375, -0.13222885131835938, -0.12104034423828125, -0.10985183715820312, -0.098663330078125, -0.08747482299804688, -0.07628631591796875, -0.06509780883789062, -0.0539093017578125, -0.042720794677734375, -0.03153228759765625, -0.020343780517578125, -0.0091552734375, 0.002033233642578125, 0.01322174072265625, 0.024410247802734375, 0.0355987548828125, 0.046787261962890625, 0.05797576904296875, 0.06916427612304688, 0.080352783203125, 0.09154129028320312, 0.10272979736328125, 0.11391830444335938, 0.1251068115234375, 0.13629531860351562, 0.14748382568359375, 0.15867233276367188, 0.16986083984375, 0.18104934692382812, 0.19223785400390625, 0.20342636108398438, 0.2146148681640625, 0.22580337524414062, 0.23699188232421875, 0.24818038940429688, 0.259368896484375, 0.2705574035644531, 0.28174591064453125, 0.2929344177246094, 0.3041229248046875, 0.3153114318847656, 0.32649993896484375, 0.3376884460449219, 0.348876953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 2.0, 5.0, 3.0, 7.0, 10.0, 14.0, 16.0, 20.0, 23.0, 21.0, 25.0, 37.0, 42.0, 50.0, 76.0, 82.0, 78.0, 73.0, 68.0, 53.0, 43.0, 50.0, 32.0, 29.0, 32.0, 14.0, 19.0, 10.0, 9.0, 11.0, 8.0, 6.0, 9.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029582977294921875, -0.0028679370880126953, -0.002777576446533203, -0.002687215805053711, -0.0025968551635742188, -0.0025064945220947266, -0.0024161338806152344, -0.002325773239135742, -0.00223541259765625, -0.002145051956176758, -0.0020546913146972656, -0.0019643306732177734, -0.0018739700317382812, -0.001783609390258789, -0.0016932487487792969, -0.0016028881072998047, -0.0015125274658203125, -0.0014221668243408203, -0.0013318061828613281, -0.001241445541381836, -0.0011510848999023438, -0.0010607242584228516, -0.0009703636169433594, -0.0008800029754638672, -0.000789642333984375, -0.0006992816925048828, -0.0006089210510253906, -0.0005185604095458984, -0.00042819976806640625, -0.00033783912658691406, -0.0002474784851074219, -0.0001571178436279297, -6.67572021484375e-05, 2.3603439331054688e-05, 0.00011396408081054688, 0.00020432472229003906, 0.00029468536376953125, 0.00038504600524902344, 0.0004754066467285156, 0.0005657672882080078, 0.0006561279296875, 0.0007464885711669922, 0.0008368492126464844, 0.0009272098541259766, 0.0010175704956054688, 0.001107931137084961, 0.0011982917785644531, 0.0012886524200439453, 0.0013790130615234375, 0.0014693737030029297, 0.0015597343444824219, 0.001650094985961914, 0.0017404556274414062, 0.0018308162689208984, 0.0019211769104003906, 0.002011537551879883, 0.002101898193359375, 0.002192258834838867, 0.0022826194763183594, 0.0023729801177978516, 0.0024633407592773438, 0.002553701400756836, 0.002644062042236328, 0.0027344226837158203, 0.0028247833251953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 5.0, 7.0, 12.0, 11.0, 6.0, 19.0, 31.0, 41.0, 49.0, 62.0, 107.0, 167.0, 263.0, 470.0, 1367.0, 215607.0, 826420.0, 2439.0, 550.0, 293.0, 187.0, 133.0, 74.0, 48.0, 43.0, 26.0, 24.0, 16.0, 15.0, 8.0, 5.0, 10.0, 6.0, 6.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05712890625, -0.055350303649902344, -0.05357170104980469, -0.05179309844970703, -0.050014495849609375, -0.04823589324951172, -0.04645729064941406, -0.044678688049316406, -0.04290008544921875, -0.041121482849121094, -0.03934288024902344, -0.03756427764892578, -0.035785675048828125, -0.03400707244873047, -0.03222846984863281, -0.030449867248535156, -0.0286712646484375, -0.026892662048339844, -0.025114059448242188, -0.02333545684814453, -0.021556854248046875, -0.01977825164794922, -0.017999649047851562, -0.016221046447753906, -0.01444244384765625, -0.012663841247558594, -0.010885238647460938, -0.009106636047363281, -0.007328033447265625, -0.005549430847167969, -0.0037708282470703125, -0.0019922256469726562, -0.000213623046875, 0.0015649795532226562, 0.0033435821533203125, 0.005122184753417969, 0.006900787353515625, 0.008679389953613281, 0.010457992553710938, 0.012236595153808594, 0.01401519775390625, 0.015793800354003906, 0.017572402954101562, 0.01935100555419922, 0.021129608154296875, 0.02290821075439453, 0.024686813354492188, 0.026465415954589844, 0.0282440185546875, 0.030022621154785156, 0.03180122375488281, 0.03357982635498047, 0.035358428955078125, 0.03713703155517578, 0.03891563415527344, 0.040694236755371094, 0.04247283935546875, 0.044251441955566406, 0.04603004455566406, 0.04780864715576172, 0.049587249755859375, 0.05136585235595703, 0.05314445495605469, 0.054923057556152344, 0.05670166015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 167.0, 644.0, 180.0, 14.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006655517499893904, -0.006295669823884964, -0.005935822147876024, -0.0055759744718670845, -0.005216127261519432, -0.004856279119849205, -0.004496431909501553, -0.004136584233492613, -0.003776736557483673, -0.0034168888814747334, -0.0030570412054657936, -0.0026971937622874975, -0.0023373460862785578, -0.001977498410269618, -0.001617650967091322, -0.0012578032910823822, -0.0008979556150734425, -0.0005381079972721636, -0.0001782603794708848, 0.00018158718012273312, 0.0005414348561316729, 0.0009012825321406126, 0.0012611299753189087, 0.0016209776513278484, 0.001980825327336788, 0.002340673003345728, 0.0027005206793546677, 0.0030603681225329638, 0.0034202157985419035, 0.0037800634745508432, 0.004139910917729139, 0.004499758593738079, 0.0048596058040857315, 0.005219453480094671, 0.005579301156103611, 0.005939148366451263, 0.0062989965081214905, 0.006658843718469143, 0.007018691394478083, 0.007378539070487022, 0.007738386746495962, 0.008098234422504902, 0.008458081632852554, 0.008817929774522781, 0.009177776984870434, 0.00953762512654066, 0.009897472336888313, 0.01025732047855854, 0.010617167688906193, 0.010977014899253845, 0.011336863040924072, 0.011696710251271725, 0.012056558392941952, 0.012416405603289604, 0.012776253744959831, 0.013136100955307484, 0.013495948165655136, 0.013855795376002789, 0.014215643517673016, 0.014575490728020668, 0.014935338869690895, 0.015295186080038548, 0.0156550332903862, 0.016014881432056427, 0.016374729573726654]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 14.0, 16.0, 17.0, 30.0, 44.0, 39.0, 34.0, 60.0, 53.0, 32.0, 53.0, 47.0, 48.0, 52.0, 53.0, 45.0, 44.0, 31.0, 38.0, 33.0, 31.0, 27.0, 17.0, 17.0, 22.0, 8.0, 14.0, 11.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0020488500595092773, -0.0019908715039491653, -0.0019328929483890533, -0.0018749143928289413, -0.0018169358372688293, -0.0017589572817087173, -0.0017009787261486053, -0.0016430001705884933, -0.0015850216150283813, -0.0015270430594682693, -0.0014690645039081573, -0.0014110859483480453, -0.0013531073927879333, -0.0012951288372278214, -0.0012371502816677094, -0.0011791717261075974, -0.0011211931705474854, -0.0010632146149873734, -0.0010052360594272614, -0.0009472575038671494, -0.0008892789483070374, -0.0008313003927469254, -0.0007733218371868134, -0.0007153432816267014, -0.0006573647260665894, -0.0005993861705064774, -0.0005414076149463654, -0.00048342905938625336, -0.00042545050382614136, -0.00036747194826602936, -0.00030949339270591736, -0.00025151483714580536, -0.00019353628158569336, -0.00013555772602558136, -7.757917046546936e-05, -1.960061490535736e-05, 3.837794065475464e-05, 9.635649621486664e-05, 0.00015433505177497864, 0.00021231360733509064, 0.00027029216289520264, 0.00032827071845531464, 0.00038624927401542664, 0.00044422782957553864, 0.0005022063851356506, 0.0005601849406957626, 0.0006181634962558746, 0.0006761420518159866, 0.0007341206073760986, 0.0007920991629362106, 0.0008500777184963226, 0.0009080562740564346, 0.0009660348296165466, 0.0010240133851766586, 0.0010819919407367706, 0.0011399704962968826, 0.0011979490518569946, 0.0012559276074171066, 0.0013139061629772186, 0.0013718847185373306, 0.0014298632740974426, 0.0014878418296575546, 0.0015458203852176666, 0.0016037989407777786, 0.0016617774963378906]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 20.0, 22.0, 18.0, 16.0, 25.0, 28.0, 23.0, 25.0, 34.0, 34.0, 41.0, 46.0, 41.0, 34.0, 41.0, 43.0, 45.0, 37.0, 36.0, 36.0, 37.0, 37.0, 30.0, 27.0, 24.0, 27.0, 22.0, 13.0, 15.0, 15.0, 11.0, 14.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.40234375, -5.2471923828125, -5.092041015625, -4.9368896484375, -4.78173828125, -4.6265869140625, -4.471435546875, -4.3162841796875, -4.1611328125, -4.0059814453125, -3.850830078125, -3.6956787109375, -3.54052734375, -3.3853759765625, -3.230224609375, -3.0750732421875, -2.919921875, -2.7647705078125, -2.609619140625, -2.4544677734375, -2.29931640625, -2.1441650390625, -1.989013671875, -1.8338623046875, -1.6787109375, -1.5235595703125, -1.368408203125, -1.2132568359375, -1.05810546875, -0.9029541015625, -0.747802734375, -0.5926513671875, -0.4375, -0.2823486328125, -0.127197265625, 0.0279541015625, 0.18310546875, 0.3382568359375, 0.493408203125, 0.6485595703125, 0.8037109375, 0.9588623046875, 1.114013671875, 1.2691650390625, 1.42431640625, 1.5794677734375, 1.734619140625, 1.8897705078125, 2.044921875, 2.2000732421875, 2.355224609375, 2.5103759765625, 2.66552734375, 2.8206787109375, 2.975830078125, 3.1309814453125, 3.2861328125, 3.4412841796875, 3.596435546875, 3.7515869140625, 3.90673828125, 4.0618896484375, 4.217041015625, 4.3721923828125, 4.52734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 18.0, 35.0, 50.0, 72.0, 117.0, 164.0, 243.0, 340.0, 527.0, 783.0, 1165.0, 1789.0, 2696.0, 4143.0, 6642.0, 12243.0, 26342.0, 74168.0, 315040.0, 438492.0, 96693.0, 31905.0, 14274.0, 7476.0, 4440.0, 2865.0, 1891.0, 1257.0, 781.0, 585.0, 404.0, 290.0, 180.0, 130.0, 73.0, 59.0, 41.0, 34.0, 28.0, 16.0, 10.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.2032470703125, -4.058837890625, -3.9144287109375, -3.77001953125, -3.6256103515625, -3.481201171875, -3.3367919921875, -3.1923828125, -3.0479736328125, -2.903564453125, -2.7591552734375, -2.61474609375, -2.4703369140625, -2.325927734375, -2.1815185546875, -2.037109375, -1.8927001953125, -1.748291015625, -1.6038818359375, -1.45947265625, -1.3150634765625, -1.170654296875, -1.0262451171875, -0.8818359375, -0.7374267578125, -0.593017578125, -0.4486083984375, -0.30419921875, -0.1597900390625, -0.015380859375, 0.1290283203125, 0.2734375, 0.4178466796875, 0.562255859375, 0.7066650390625, 0.85107421875, 0.9954833984375, 1.139892578125, 1.2843017578125, 1.4287109375, 1.5731201171875, 1.717529296875, 1.8619384765625, 2.00634765625, 2.1507568359375, 2.295166015625, 2.4395751953125, 2.583984375, 2.7283935546875, 2.872802734375, 3.0172119140625, 3.16162109375, 3.3060302734375, 3.450439453125, 3.5948486328125, 3.7392578125, 3.8836669921875, 4.028076171875, 4.1724853515625, 4.31689453125, 4.4613037109375, 4.605712890625, 4.7501220703125, 4.89453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 7.0, 10.0, 11.0, 5.0, 10.0, 16.0, 24.0, 23.0, 25.0, 24.0, 40.0, 30.0, 35.0, 36.0, 37.0, 52.0, 85.0, 176.0, 1699.0, 210.0, 79.0, 53.0, 41.0, 40.0, 34.0, 30.0, 24.0, 36.0, 26.0, 25.0, 15.0, 23.0, 12.0, 15.0, 6.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-21.859375, -21.27783203125, -20.6962890625, -20.11474609375, -19.533203125, -18.95166015625, -18.3701171875, -17.78857421875, -17.20703125, -16.62548828125, -16.0439453125, -15.46240234375, -14.880859375, -14.29931640625, -13.7177734375, -13.13623046875, -12.5546875, -11.97314453125, -11.3916015625, -10.81005859375, -10.228515625, -9.64697265625, -9.0654296875, -8.48388671875, -7.90234375, -7.32080078125, -6.7392578125, -6.15771484375, -5.576171875, -4.99462890625, -4.4130859375, -3.83154296875, -3.25, -2.66845703125, -2.0869140625, -1.50537109375, -0.923828125, -0.34228515625, 0.2392578125, 0.82080078125, 1.40234375, 1.98388671875, 2.5654296875, 3.14697265625, 3.728515625, 4.31005859375, 4.8916015625, 5.47314453125, 6.0546875, 6.63623046875, 7.2177734375, 7.79931640625, 8.380859375, 8.96240234375, 9.5439453125, 10.12548828125, 10.70703125, 11.28857421875, 11.8701171875, 12.45166015625, 13.033203125, 13.61474609375, 14.1962890625, 14.77783203125, 15.359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 12.0, 13.0, 13.0, 24.0, 28.0, 39.0, 57.0, 97.0, 113.0, 204.0, 374.0, 1153.0, 18679.0, 3091759.0, 30707.0, 1394.0, 366.0, 218.0, 122.0, 94.0, 63.0, 43.0, 36.0, 22.0, 12.0, 16.0, 8.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.28125, -40.8505859375, -39.419921875, -37.9892578125, -36.55859375, -35.1279296875, -33.697265625, -32.2666015625, -30.8359375, -29.4052734375, -27.974609375, -26.5439453125, -25.11328125, -23.6826171875, -22.251953125, -20.8212890625, -19.390625, -17.9599609375, -16.529296875, -15.0986328125, -13.66796875, -12.2373046875, -10.806640625, -9.3759765625, -7.9453125, -6.5146484375, -5.083984375, -3.6533203125, -2.22265625, -0.7919921875, 0.638671875, 2.0693359375, 3.5, 4.9306640625, 6.361328125, 7.7919921875, 9.22265625, 10.6533203125, 12.083984375, 13.5146484375, 14.9453125, 16.3759765625, 17.806640625, 19.2373046875, 20.66796875, 22.0986328125, 23.529296875, 24.9599609375, 26.390625, 27.8212890625, 29.251953125, 30.6826171875, 32.11328125, 33.5439453125, 34.974609375, 36.4052734375, 37.8359375, 39.2666015625, 40.697265625, 42.1279296875, 43.55859375, 44.9892578125, 46.419921875, 47.8505859375, 49.28125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 59.0, 307.0, 457.0, 161.0, 20.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.2296371459961, -80.72634887695312, -78.22306823730469, -75.71977996826172, -73.21649932861328, -70.71321105957031, -68.20993041992188, -65.7066421508789, -63.2033576965332, -60.7000732421875, -58.1967887878418, -55.693504333496094, -53.190216064453125, -50.68693542480469, -48.18364715576172, -45.680362701416016, -43.17707824707031, -40.67379379272461, -38.170509338378906, -35.6672248840332, -33.1639404296875, -30.660654067993164, -28.157367706298828, -25.654083251953125, -23.150798797607422, -20.64751434326172, -18.144229888916016, -15.64094352722168, -13.137659072875977, -10.634374618530273, -8.131089210510254, -5.627803802490234, -3.1245193481445312, -0.6212344169616699, 1.8820505142211914, 4.385335445404053, 6.888620376586914, 9.391904830932617, 11.895190238952637, 14.398475646972656, 16.90176010131836, 19.405044555664062, 21.908329010009766, 24.4116153717041, 26.914899826049805, 29.418184280395508, 31.921470642089844, 34.42475509643555, 36.92803955078125, 39.43132400512695, 41.934608459472656, 44.43789291381836, 46.94117736816406, 49.44446563720703, 51.947750091552734, 54.45103454589844, 56.95431900024414, 59.457603454589844, 61.96088790893555, 64.46417236328125, 66.96746063232422, 69.47074127197266, 71.97402954101562, 74.47731018066406, 76.98059844970703]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 8.0, 10.0, 6.0, 17.0, 16.0, 20.0, 24.0, 16.0, 27.0, 23.0, 34.0, 32.0, 39.0, 44.0, 32.0, 38.0, 31.0, 31.0, 43.0, 52.0, 44.0, 32.0, 29.0, 41.0, 31.0, 42.0, 33.0, 28.0, 19.0, 17.0, 26.0, 24.0, 12.0, 9.0, 13.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.48713302612305, -49.892730712890625, -48.29833221435547, -46.70392990112305, -45.10953140258789, -43.51512908935547, -41.92073059082031, -40.32632827758789, -38.73192596435547, -37.13752365112305, -35.54312515258789, -33.94872283935547, -32.35432434082031, -30.75992202758789, -29.1655216217041, -27.571121215820312, -25.976722717285156, -24.382322311401367, -22.787921905517578, -21.193519592285156, -19.59912109375, -18.004718780517578, -16.41031837463379, -14.81591796875, -13.221517562866211, -11.627117156982422, -10.032716751098633, -8.438315391540527, -6.843914985656738, -5.249514579772949, -3.6551132202148438, -2.0607128143310547, -0.46631622314453125, 1.128084421157837, 2.722485065460205, 4.316885948181152, 5.911286354064941, 7.5056867599487305, 9.100088119506836, 10.694488525390625, 12.288888931274414, 13.883289337158203, 15.477689743041992, 17.07209014892578, 18.666492462158203, 20.26089096069336, 21.85529327392578, 23.44969367980957, 25.04409408569336, 26.63849449157715, 28.232894897460938, 29.82729721069336, 31.421695709228516, 33.01609802246094, 34.610496520996094, 36.204898834228516, 37.79930114746094, 39.39370346069336, 40.988101959228516, 42.58250427246094, 44.176902770996094, 45.771305084228516, 47.36570739746094, 48.960105895996094, 50.55450439453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 1.0, 8.0, 1.0, 5.0, 8.0, 7.0, 11.0, 15.0, 17.0, 18.0, 24.0, 20.0, 22.0, 19.0, 27.0, 27.0, 38.0, 41.0, 34.0, 35.0, 42.0, 47.0, 42.0, 30.0, 38.0, 35.0, 36.0, 38.0, 41.0, 26.0, 29.0, 31.0, 23.0, 29.0, 18.0, 20.0, 17.0, 13.0, 13.0, 13.0, 12.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.3515625, -5.19842529296875, -5.0452880859375, -4.89215087890625, -4.739013671875, -4.58587646484375, -4.4327392578125, -4.27960205078125, -4.12646484375, -3.97332763671875, -3.8201904296875, -3.66705322265625, -3.513916015625, -3.36077880859375, -3.2076416015625, -3.05450439453125, -2.9013671875, -2.74822998046875, -2.5950927734375, -2.44195556640625, -2.288818359375, -2.13568115234375, -1.9825439453125, -1.82940673828125, -1.67626953125, -1.52313232421875, -1.3699951171875, -1.21685791015625, -1.063720703125, -0.91058349609375, -0.7574462890625, -0.60430908203125, -0.451171875, -0.29803466796875, -0.1448974609375, 0.00823974609375, 0.161376953125, 0.31451416015625, 0.4676513671875, 0.62078857421875, 0.77392578125, 0.92706298828125, 1.0802001953125, 1.23333740234375, 1.386474609375, 1.53961181640625, 1.6927490234375, 1.84588623046875, 1.9990234375, 2.15216064453125, 2.3052978515625, 2.45843505859375, 2.611572265625, 2.76470947265625, 2.9178466796875, 3.07098388671875, 3.22412109375, 3.37725830078125, 3.5303955078125, 3.68353271484375, 3.836669921875, 3.98980712890625, 4.1429443359375, 4.29608154296875, 4.44921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 12.0, 12.0, 17.0, 22.0, 30.0, 24.0, 43.0, 75.0, 98.0, 162.0, 214.0, 379.0, 527.0, 935.0, 1569.0, 2748.0, 5162.0, 10019.0, 21319.0, 50931.0, 151626.0, 528431.0, 1302299.0, 1321608.0, 542995.0, 157475.0, 52142.0, 21543.0, 10013.0, 5059.0, 2756.0, 1562.0, 946.0, 528.0, 336.0, 214.0, 145.0, 83.0, 56.0, 53.0, 22.0, 29.0, 24.0, 13.0, 5.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.25, -6.0606689453125, -5.871337890625, -5.6820068359375, -5.49267578125, -5.3033447265625, -5.114013671875, -4.9246826171875, -4.7353515625, -4.5460205078125, -4.356689453125, -4.1673583984375, -3.97802734375, -3.7886962890625, -3.599365234375, -3.4100341796875, -3.220703125, -3.0313720703125, -2.842041015625, -2.6527099609375, -2.46337890625, -2.2740478515625, -2.084716796875, -1.8953857421875, -1.7060546875, -1.5167236328125, -1.327392578125, -1.1380615234375, -0.94873046875, -0.7593994140625, -0.570068359375, -0.3807373046875, -0.19140625, -0.0020751953125, 0.187255859375, 0.3765869140625, 0.56591796875, 0.7552490234375, 0.944580078125, 1.1339111328125, 1.3232421875, 1.5125732421875, 1.701904296875, 1.8912353515625, 2.08056640625, 2.2698974609375, 2.459228515625, 2.6485595703125, 2.837890625, 3.0272216796875, 3.216552734375, 3.4058837890625, 3.59521484375, 3.7845458984375, 3.973876953125, 4.1632080078125, 4.3525390625, 4.5418701171875, 4.731201171875, 4.9205322265625, 5.10986328125, 5.2991943359375, 5.488525390625, 5.6778564453125, 5.8671875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 7.0, 18.0, 29.0, 37.0, 54.0, 63.0, 105.0, 119.0, 181.0, 228.0, 274.0, 450.0, 502.0, 471.0, 423.0, 291.0, 214.0, 171.0, 134.0, 87.0, 56.0, 41.0, 32.0, 26.0, 13.0, 11.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.2310791015625, -10.798095703125, -10.3651123046875, -9.93212890625, -9.4991455078125, -9.066162109375, -8.6331787109375, -8.2001953125, -7.7672119140625, -7.334228515625, -6.9012451171875, -6.46826171875, -6.0352783203125, -5.602294921875, -5.1693115234375, -4.736328125, -4.3033447265625, -3.870361328125, -3.4373779296875, -3.00439453125, -2.5714111328125, -2.138427734375, -1.7054443359375, -1.2724609375, -0.8394775390625, -0.406494140625, 0.0264892578125, 0.45947265625, 0.8924560546875, 1.325439453125, 1.7584228515625, 2.19140625, 2.6243896484375, 3.057373046875, 3.4903564453125, 3.92333984375, 4.3563232421875, 4.789306640625, 5.2222900390625, 5.6552734375, 6.0882568359375, 6.521240234375, 6.9542236328125, 7.38720703125, 7.8201904296875, 8.253173828125, 8.6861572265625, 9.119140625, 9.5521240234375, 9.985107421875, 10.4180908203125, 10.85107421875, 11.2840576171875, 11.717041015625, 12.1500244140625, 12.5830078125, 13.0159912109375, 13.448974609375, 13.8819580078125, 14.31494140625, 14.7479248046875, 15.180908203125, 15.6138916015625, 16.046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 12.0, 18.0, 24.0, 49.0, 46.0, 70.0, 96.0, 145.0, 244.0, 405.0, 1084.0, 5460.0, 107353.0, 3670372.0, 393710.0, 12117.0, 1648.0, 558.0, 283.0, 177.0, 112.0, 82.0, 62.0, 39.0, 28.0, 22.0, 15.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.5625, -26.34619140625, -25.1298828125, -23.91357421875, -22.697265625, -21.48095703125, -20.2646484375, -19.04833984375, -17.83203125, -16.61572265625, -15.3994140625, -14.18310546875, -12.966796875, -11.75048828125, -10.5341796875, -9.31787109375, -8.1015625, -6.88525390625, -5.6689453125, -4.45263671875, -3.236328125, -2.02001953125, -0.8037109375, 0.41259765625, 1.62890625, 2.84521484375, 4.0615234375, 5.27783203125, 6.494140625, 7.71044921875, 8.9267578125, 10.14306640625, 11.359375, 12.57568359375, 13.7919921875, 15.00830078125, 16.224609375, 17.44091796875, 18.6572265625, 19.87353515625, 21.08984375, 22.30615234375, 23.5224609375, 24.73876953125, 25.955078125, 27.17138671875, 28.3876953125, 29.60400390625, 30.8203125, 32.03662109375, 33.2529296875, 34.46923828125, 35.685546875, 36.90185546875, 38.1181640625, 39.33447265625, 40.55078125, 41.76708984375, 42.9833984375, 44.19970703125, 45.416015625, 46.63232421875, 47.8486328125, 49.06494140625, 50.28125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 20.0, 27.0, 45.0, 72.0, 108.0, 152.0, 153.0, 152.0, 113.0, 61.0, 44.0, 30.0, 19.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.60558319091797, -121.05137634277344, -118.49716186523438, -115.94295501708984, -113.38874816894531, -110.83454132080078, -108.28033447265625, -105.72611999511719, -103.17191314697266, -100.61770629882812, -98.06349182128906, -95.50928497314453, -92.955078125, -90.40087127685547, -87.84666442871094, -85.29244995117188, -82.73824310302734, -80.18403625488281, -77.62982177734375, -75.07561492919922, -72.52140808105469, -69.96720123291016, -67.41299438476562, -64.85877990722656, -62.30457305908203, -59.7503662109375, -57.1961555480957, -54.641944885253906, -52.087738037109375, -49.533531188964844, -46.97932052612305, -44.42510986328125, -41.87089538574219, -39.316688537597656, -36.76247787475586, -34.20826721191406, -31.65406036376953, -29.099851608276367, -26.545642852783203, -23.99143409729004, -21.437225341796875, -18.88301658630371, -16.328807830810547, -13.774599075317383, -11.220390319824219, -8.666181564331055, -6.111972808837891, -3.5577640533447266, -1.0035552978515625, 1.5506534576416016, 4.104862213134766, 6.65907096862793, 9.213279724121094, 11.767488479614258, 14.321697235107422, 16.875905990600586, 19.43011474609375, 21.984323501586914, 24.538532257080078, 27.092741012573242, 29.646949768066406, 32.20115661621094, 34.755367279052734, 37.30957794189453, 39.86378479003906]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 6.0, 2.0, 9.0, 8.0, 10.0, 6.0, 16.0, 14.0, 14.0, 23.0, 26.0, 14.0, 21.0, 24.0, 24.0, 29.0, 23.0, 35.0, 41.0, 36.0, 29.0, 46.0, 43.0, 36.0, 44.0, 37.0, 38.0, 41.0, 30.0, 34.0, 34.0, 20.0, 16.0, 21.0, 23.0, 15.0, 13.0, 16.0, 11.0, 7.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.10260009765625, -36.93830108642578, -35.77400207519531, -34.60970687866211, -33.44540786743164, -32.28110885620117, -31.116811752319336, -29.9525146484375, -28.78821563720703, -27.623916625976562, -26.459619522094727, -25.29532241821289, -24.131023406982422, -22.966724395751953, -21.802427291870117, -20.63813018798828, -19.473831176757812, -18.309532165527344, -17.145235061645508, -15.980937004089355, -14.816638946533203, -13.65234088897705, -12.488042831420898, -11.323744773864746, -10.159446716308594, -8.995148658752441, -7.830850601196289, -6.666552543640137, -5.502254486083984, -4.337956428527832, -3.1736583709716797, -2.0093603134155273, -0.845062255859375, 0.31923580169677734, 1.4835338592529297, 2.647831916809082, 3.8121299743652344, 4.976428031921387, 6.140726089477539, 7.305024147033691, 8.469322204589844, 9.633620262145996, 10.797918319702148, 11.9622163772583, 13.126514434814453, 14.290812492370605, 15.455110549926758, 16.619407653808594, 17.783706665039062, 18.94800567626953, 20.112302780151367, 21.276599884033203, 22.440898895263672, 23.60519790649414, 24.769495010375977, 25.933792114257812, 27.09809112548828, 28.26239013671875, 29.426687240600586, 30.590984344482422, 31.75528335571289, 32.91958236694336, 34.08387756347656, 35.24817657470703, 36.4124755859375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 42.0, 40.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 9.0, 13.0, 16.0, 27.0, 39.0, 75.0, 85.0, 144.0, 220.0, 343.0, 562.0, 782.0, 1267.0, 1957.0, 2976.0, 4636.0, 7105.0, 11002.0, 17378.0, 27069.0, 42489.0, 66520.0, 102655.0, 150531.0, 180080.0, 148493.0, 100888.0, 65226.0, 41673.0, 26689.0, 16766.0, 10982.0, 7044.0, 4481.0, 2994.0, 1812.0, 1261.0, 778.0, 521.0, 333.0, 221.0, 145.0, 92.0, 70.0, 39.0, 28.0, 15.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.54736328125, -0.5305099487304688, -0.5136566162109375, -0.49680328369140625, -0.479949951171875, -0.46309661865234375, -0.4462432861328125, -0.42938995361328125, -0.41253662109375, -0.39568328857421875, -0.3788299560546875, -0.36197662353515625, -0.345123291015625, -0.32826995849609375, -0.3114166259765625, -0.29456329345703125, -0.2777099609375, -0.26085662841796875, -0.2440032958984375, -0.22714996337890625, -0.210296630859375, -0.19344329833984375, -0.1765899658203125, -0.15973663330078125, -0.14288330078125, -0.12602996826171875, -0.1091766357421875, -0.09232330322265625, -0.075469970703125, -0.05861663818359375, -0.0417633056640625, -0.02490997314453125, -0.008056640625, 0.00879669189453125, 0.0256500244140625, 0.04250335693359375, 0.059356689453125, 0.07621002197265625, 0.0930633544921875, 0.10991668701171875, 0.12677001953125, 0.14362335205078125, 0.1604766845703125, 0.17733001708984375, 0.194183349609375, 0.21103668212890625, 0.2278900146484375, 0.24474334716796875, 0.2615966796875, 0.27845001220703125, 0.2953033447265625, 0.31215667724609375, 0.329010009765625, 0.34586334228515625, 0.3627166748046875, 0.37957000732421875, 0.39642333984375, 0.41327667236328125, 0.4301300048828125, 0.44698333740234375, 0.463836669921875, 0.48069000244140625, 0.4975433349609375, 0.5143966674804688, 0.53125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 11.0, 10.0, 10.0, 15.0, 14.0, 12.0, 19.0, 22.0, 19.0, 21.0, 25.0, 33.0, 26.0, 33.0, 48.0, 40.0, 42.0, 36.0, 1066.0, 49.0, 35.0, 54.0, 44.0, 41.0, 36.0, 23.0, 28.0, 35.0, 28.0, 19.0, 23.0, 18.0, 23.0, 9.0, 16.0, 8.0, 5.0, 6.0, 8.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-3.892578125, -3.78668212890625, -3.6807861328125, -3.57489013671875, -3.468994140625, -3.36309814453125, -3.2572021484375, -3.15130615234375, -3.04541015625, -2.93951416015625, -2.8336181640625, -2.72772216796875, -2.621826171875, -2.51593017578125, -2.4100341796875, -2.30413818359375, -2.1982421875, -2.09234619140625, -1.9864501953125, -1.88055419921875, -1.774658203125, -1.66876220703125, -1.5628662109375, -1.45697021484375, -1.35107421875, -1.24517822265625, -1.1392822265625, -1.03338623046875, -0.927490234375, -0.82159423828125, -0.7156982421875, -0.60980224609375, -0.50390625, -0.39801025390625, -0.2921142578125, -0.18621826171875, -0.080322265625, 0.02557373046875, 0.1314697265625, 0.23736572265625, 0.34326171875, 0.44915771484375, 0.5550537109375, 0.66094970703125, 0.766845703125, 0.87274169921875, 0.9786376953125, 1.08453369140625, 1.1904296875, 1.29632568359375, 1.4022216796875, 1.50811767578125, 1.614013671875, 1.71990966796875, 1.8258056640625, 1.93170166015625, 2.03759765625, 2.14349365234375, 2.2493896484375, 2.35528564453125, 2.461181640625, 2.56707763671875, 2.6729736328125, 2.77886962890625, 2.884765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 9.0, 5.0, 13.0, 8.0, 29.0, 47.0, 44.0, 79.0, 94.0, 188.0, 245.0, 372.0, 552.0, 904.0, 1288.0, 2064.0, 3070.0, 4614.0, 6891.0, 10818.0, 16144.0, 25087.0, 37506.0, 56598.0, 83411.0, 116957.0, 223890.0, 1117129.0, 122062.0, 88863.0, 60573.0, 40381.0, 26397.0, 17427.0, 11332.0, 7484.0, 4846.0, 3329.0, 2184.0, 1436.0, 969.0, 578.0, 390.0, 278.0, 189.0, 119.0, 85.0, 63.0, 34.0, 23.0, 23.0, 14.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.355224609375, -0.34415435791015625, -0.3330841064453125, -0.32201385498046875, -0.310943603515625, -0.29987335205078125, -0.2888031005859375, -0.27773284912109375, -0.26666259765625, -0.25559234619140625, -0.2445220947265625, -0.23345184326171875, -0.222381591796875, -0.21131134033203125, -0.2002410888671875, -0.18917083740234375, -0.1781005859375, -0.16703033447265625, -0.1559600830078125, -0.14488983154296875, -0.133819580078125, -0.12274932861328125, -0.1116790771484375, -0.10060882568359375, -0.08953857421875, -0.07846832275390625, -0.0673980712890625, -0.05632781982421875, -0.045257568359375, -0.03418731689453125, -0.0231170654296875, -0.01204681396484375, -0.0009765625, 0.01009368896484375, 0.0211639404296875, 0.03223419189453125, 0.043304443359375, 0.05437469482421875, 0.0654449462890625, 0.07651519775390625, 0.08758544921875, 0.09865570068359375, 0.1097259521484375, 0.12079620361328125, 0.131866455078125, 0.14293670654296875, 0.1540069580078125, 0.16507720947265625, 0.1761474609375, 0.18721771240234375, 0.1982879638671875, 0.20935821533203125, 0.220428466796875, 0.23149871826171875, 0.2425689697265625, 0.25363922119140625, 0.26470947265625, 0.27577972412109375, 0.2868499755859375, 0.29792022705078125, 0.308990478515625, 0.32006072998046875, 0.3311309814453125, 0.34220123291015625, 0.353271484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 16.0, 19.0, 11.0, 17.0, 12.0, 24.0, 21.0, 25.0, 38.0, 45.0, 53.0, 73.0, 66.0, 66.0, 75.0, 69.0, 66.0, 54.0, 38.0, 35.0, 31.0, 35.0, 16.0, 11.0, 12.0, 14.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003917694091796875, -0.003775477409362793, -0.003633260726928711, -0.003491044044494629, -0.003348827362060547, -0.003206610679626465, -0.003064393997192383, -0.0029221773147583008, -0.0027799606323242188, -0.0026377439498901367, -0.0024955272674560547, -0.0023533105850219727, -0.0022110939025878906, -0.0020688772201538086, -0.0019266605377197266, -0.0017844438552856445, -0.0016422271728515625, -0.0015000104904174805, -0.0013577938079833984, -0.0012155771255493164, -0.0010733604431152344, -0.0009311437606811523, -0.0007889270782470703, -0.0006467103958129883, -0.0005044937133789062, -0.0003622770309448242, -0.0002200603485107422, -7.784366607666016e-05, 6.437301635742188e-05, 0.0002065896987915039, 0.00034880638122558594, 0.000491023063659668, 0.00063323974609375, 0.000775456428527832, 0.0009176731109619141, 0.001059889793395996, 0.0012021064758300781, 0.0013443231582641602, 0.0014865398406982422, 0.0016287565231323242, 0.0017709732055664062, 0.0019131898880004883, 0.0020554065704345703, 0.0021976232528686523, 0.0023398399353027344, 0.0024820566177368164, 0.0026242733001708984, 0.0027664899826049805, 0.0029087066650390625, 0.0030509233474731445, 0.0031931400299072266, 0.0033353567123413086, 0.0034775733947753906, 0.0036197900772094727, 0.0037620067596435547, 0.0039042234420776367, 0.004046440124511719, 0.004188656806945801, 0.004330873489379883, 0.004473090171813965, 0.004615306854248047, 0.004757523536682129, 0.004899740219116211, 0.005041956901550293, 0.005184173583984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 19.0, 18.0, 24.0, 28.0, 47.0, 66.0, 93.0, 136.0, 178.0, 296.0, 521.0, 2716.0, 823777.0, 217757.0, 1543.0, 449.0, 282.0, 157.0, 127.0, 70.0, 55.0, 34.0, 37.0, 25.0, 21.0, 14.0, 14.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.1013631820678711, -0.09853935241699219, -0.09571552276611328, -0.09289169311523438, -0.09006786346435547, -0.08724403381347656, -0.08442020416259766, -0.08159637451171875, -0.07877254486083984, -0.07594871520996094, -0.07312488555908203, -0.07030105590820312, -0.06747722625732422, -0.06465339660644531, -0.061829566955566406, -0.0590057373046875, -0.056181907653808594, -0.05335807800292969, -0.05053424835205078, -0.047710418701171875, -0.04488658905029297, -0.04206275939941406, -0.039238929748535156, -0.03641510009765625, -0.033591270446777344, -0.030767440795898438, -0.02794361114501953, -0.025119781494140625, -0.02229595184326172, -0.019472122192382812, -0.016648292541503906, -0.013824462890625, -0.011000633239746094, -0.008176803588867188, -0.005352973937988281, -0.002529144287109375, 0.00029468536376953125, 0.0031185150146484375, 0.005942344665527344, 0.00876617431640625, 0.011590003967285156, 0.014413833618164062, 0.01723766326904297, 0.020061492919921875, 0.02288532257080078, 0.025709152221679688, 0.028532981872558594, 0.0313568115234375, 0.034180641174316406, 0.03700447082519531, 0.03982830047607422, 0.042652130126953125, 0.04547595977783203, 0.04829978942871094, 0.051123619079589844, 0.05394744873046875, 0.056771278381347656, 0.05959510803222656, 0.06241893768310547, 0.06524276733398438, 0.06806659698486328, 0.07089042663574219, 0.0737142562866211, 0.0765380859375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 13.0, 850.0, 151.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0566568598151207, -0.05529935285449028, -0.05394184589385986, -0.052584342658519745, -0.05122683569788933, -0.04986932873725891, -0.048511821776628494, -0.04715431481599808, -0.04579680785536766, -0.044439300894737244, -0.04308179393410683, -0.04172428697347641, -0.04036678373813629, -0.039009276777505875, -0.03765176981687546, -0.03629426285624504, -0.034936755895614624, -0.03357924893498421, -0.03222174197435379, -0.030864236876368523, -0.029506729915738106, -0.028149224817752838, -0.02679171785712242, -0.025434210896492004, -0.024076707661151886, -0.02271920070052147, -0.0213616956025362, -0.020004188641905785, -0.018646681681275368, -0.0172891765832901, -0.015931669622659683, -0.014574162662029266, -0.013216657564043999, -0.011859151534736156, -0.01050164457410574, -0.009144138544797897, -0.007786632049828768, -0.006429125554859638, -0.005071619525551796, -0.003714112564921379, -0.002356606535613537, -0.000999100157059729, 0.00035840622149407864, 0.0017159124836325645, 0.003073418978601694, 0.004430925473570824, 0.005788431502878666, 0.007145938463509083, 0.008503444492816925, 0.009860950522124767, 0.011218457482755184, 0.012575963512063026, 0.013933470472693443, 0.015290976502001286, 0.016648482531309128, 0.018005989491939545, 0.01936349645256996, 0.02072100341320038, 0.022078508511185646, 0.023436015471816063, 0.02479352243244648, 0.026151027530431747, 0.027508534491062164, 0.02886604145169258, 0.03022354654967785]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 5.0, 11.0, 14.0, 20.0, 21.0, 23.0, 19.0, 35.0, 32.0, 34.0, 43.0, 45.0, 45.0, 42.0, 58.0, 37.0, 53.0, 44.0, 42.0, 42.0, 42.0, 42.0, 41.0, 35.0, 33.0, 27.0, 15.0, 23.0, 20.0, 7.0, 18.0, 11.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031978487968444824, -0.0031014643609523773, -0.003005079925060272, -0.002908695489168167, -0.002812311053276062, -0.002715926617383957, -0.002619542181491852, -0.0025231577455997467, -0.0024267733097076416, -0.0023303888738155365, -0.0022340044379234314, -0.0021376200020313263, -0.002041235566139221, -0.001944851130247116, -0.001848466694355011, -0.0017520822584629059, -0.0016556978225708008, -0.0015593133866786957, -0.0014629289507865906, -0.0013665445148944855, -0.0012701600790023804, -0.0011737756431102753, -0.0010773912072181702, -0.000981006771326065, -0.00088462233543396, -0.0007882378995418549, -0.0006918534636497498, -0.0005954690277576447, -0.0004990845918655396, -0.00040270015597343445, -0.00030631572008132935, -0.00020993128418922424, -0.00011354684829711914, -1.7162412405014038e-05, 7.922202348709106e-05, 0.00017560645937919617, 0.00027199089527130127, 0.00036837533116340637, 0.0004647597670555115, 0.0005611442029476166, 0.0006575286388397217, 0.0007539130747318268, 0.0008502975106239319, 0.000946681946516037, 0.001043066382408142, 0.0011394508183002472, 0.0012358352541923523, 0.0013322196900844574, 0.0014286041259765625, 0.0015249885618686676, 0.0016213729977607727, 0.0017177574336528778, 0.001814141869544983, 0.001910526305437088, 0.002006910741329193, 0.0021032951772212982, 0.0021996796131134033, 0.0022960640490055084, 0.0023924484848976135, 0.0024888329207897186, 0.0025852173566818237, 0.002681601792573929, 0.002777986228466034, 0.002874370664358139, 0.002970755100250244]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 6.0, 5.0, 15.0, 5.0, 8.0, 16.0, 14.0, 23.0, 32.0, 18.0, 22.0, 36.0, 36.0, 31.0, 41.0, 41.0, 44.0, 49.0, 30.0, 37.0, 40.0, 33.0, 43.0, 40.0, 30.0, 40.0, 34.0, 24.0, 40.0, 24.0, 19.0, 20.0, 19.0, 13.0, 15.0, 11.0, 9.0, 8.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.625, -5.458251953125, -5.29150390625, -5.124755859375, -4.9580078125, -4.791259765625, -4.62451171875, -4.457763671875, -4.291015625, -4.124267578125, -3.95751953125, -3.790771484375, -3.6240234375, -3.457275390625, -3.29052734375, -3.123779296875, -2.95703125, -2.790283203125, -2.62353515625, -2.456787109375, -2.2900390625, -2.123291015625, -1.95654296875, -1.789794921875, -1.623046875, -1.456298828125, -1.28955078125, -1.122802734375, -0.9560546875, -0.789306640625, -0.62255859375, -0.455810546875, -0.2890625, -0.122314453125, 0.04443359375, 0.211181640625, 0.3779296875, 0.544677734375, 0.71142578125, 0.878173828125, 1.044921875, 1.211669921875, 1.37841796875, 1.545166015625, 1.7119140625, 1.878662109375, 2.04541015625, 2.212158203125, 2.37890625, 2.545654296875, 2.71240234375, 2.879150390625, 3.0458984375, 3.212646484375, 3.37939453125, 3.546142578125, 3.712890625, 3.879638671875, 4.04638671875, 4.213134765625, 4.3798828125, 4.546630859375, 4.71337890625, 4.880126953125, 5.046875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 4.0, 6.0, 13.0, 24.0, 35.0, 33.0, 79.0, 91.0, 129.0, 187.0, 282.0, 410.0, 537.0, 849.0, 1288.0, 1938.0, 3205.0, 5699.0, 11385.0, 26710.0, 78535.0, 295515.0, 427141.0, 123202.0, 38021.0, 15156.0, 7294.0, 3963.0, 2262.0, 1478.0, 935.0, 651.0, 451.0, 357.0, 225.0, 136.0, 97.0, 71.0, 57.0, 29.0, 27.0, 11.0, 12.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05859375, -3.91949462890625, -3.7803955078125, -3.64129638671875, -3.502197265625, -3.36309814453125, -3.2239990234375, -3.08489990234375, -2.94580078125, -2.80670166015625, -2.6676025390625, -2.52850341796875, -2.389404296875, -2.25030517578125, -2.1112060546875, -1.97210693359375, -1.8330078125, -1.69390869140625, -1.5548095703125, -1.41571044921875, -1.276611328125, -1.13751220703125, -0.9984130859375, -0.85931396484375, -0.72021484375, -0.58111572265625, -0.4420166015625, -0.30291748046875, -0.163818359375, -0.02471923828125, 0.1143798828125, 0.25347900390625, 0.392578125, 0.53167724609375, 0.6707763671875, 0.80987548828125, 0.948974609375, 1.08807373046875, 1.2271728515625, 1.36627197265625, 1.50537109375, 1.64447021484375, 1.7835693359375, 1.92266845703125, 2.061767578125, 2.20086669921875, 2.3399658203125, 2.47906494140625, 2.6181640625, 2.75726318359375, 2.8963623046875, 3.03546142578125, 3.174560546875, 3.31365966796875, 3.4527587890625, 3.59185791015625, 3.73095703125, 3.87005615234375, 4.0091552734375, 4.14825439453125, 4.287353515625, 4.42645263671875, 4.5655517578125, 4.70465087890625, 4.84375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 7.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 11.0, 11.0, 14.0, 15.0, 21.0, 26.0, 28.0, 26.0, 35.0, 33.0, 32.0, 37.0, 43.0, 60.0, 105.0, 345.0, 1569.0, 127.0, 72.0, 42.0, 43.0, 28.0, 34.0, 37.0, 32.0, 22.0, 26.0, 17.0, 19.0, 21.0, 14.0, 11.0, 6.0, 11.0, 6.0, 11.0, 3.0, 7.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.393310546875, -15.84912109375, -15.304931640625, -14.7607421875, -14.216552734375, -13.67236328125, -13.128173828125, -12.583984375, -12.039794921875, -11.49560546875, -10.951416015625, -10.4072265625, -9.863037109375, -9.31884765625, -8.774658203125, -8.23046875, -7.686279296875, -7.14208984375, -6.597900390625, -6.0537109375, -5.509521484375, -4.96533203125, -4.421142578125, -3.876953125, -3.332763671875, -2.78857421875, -2.244384765625, -1.7001953125, -1.156005859375, -0.61181640625, -0.067626953125, 0.4765625, 1.020751953125, 1.56494140625, 2.109130859375, 2.6533203125, 3.197509765625, 3.74169921875, 4.285888671875, 4.830078125, 5.374267578125, 5.91845703125, 6.462646484375, 7.0068359375, 7.551025390625, 8.09521484375, 8.639404296875, 9.18359375, 9.727783203125, 10.27197265625, 10.816162109375, 11.3603515625, 11.904541015625, 12.44873046875, 12.992919921875, 13.537109375, 14.081298828125, 14.62548828125, 15.169677734375, 15.7138671875, 16.258056640625, 16.80224609375, 17.346435546875, 17.890625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 9.0, 6.0, 11.0, 12.0, 7.0, 9.0, 19.0, 14.0, 21.0, 35.0, 25.0, 42.0, 55.0, 85.0, 97.0, 107.0, 167.0, 218.0, 376.0, 1278.0, 17145.0, 3054831.0, 67267.0, 2312.0, 523.0, 286.0, 185.0, 118.0, 92.0, 76.0, 52.0, 45.0, 34.0, 25.0, 20.0, 22.0, 10.0, 8.0, 10.0, 5.0, 8.0, 6.0, 8.0, 10.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-35.84375, -34.74609375, -33.6484375, -32.55078125, -31.453125, -30.35546875, -29.2578125, -28.16015625, -27.0625, -25.96484375, -24.8671875, -23.76953125, -22.671875, -21.57421875, -20.4765625, -19.37890625, -18.28125, -17.18359375, -16.0859375, -14.98828125, -13.890625, -12.79296875, -11.6953125, -10.59765625, -9.5, -8.40234375, -7.3046875, -6.20703125, -5.109375, -4.01171875, -2.9140625, -1.81640625, -0.71875, 0.37890625, 1.4765625, 2.57421875, 3.671875, 4.76953125, 5.8671875, 6.96484375, 8.0625, 9.16015625, 10.2578125, 11.35546875, 12.453125, 13.55078125, 14.6484375, 15.74609375, 16.84375, 17.94140625, 19.0390625, 20.13671875, 21.234375, 22.33203125, 23.4296875, 24.52734375, 25.625, 26.72265625, 27.8203125, 28.91796875, 30.015625, 31.11328125, 32.2109375, 33.30859375, 34.40625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [37.0, 929.0, 49.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.242090225219727, -3.6338396072387695, 2.9744110107421875, 9.582662582397461, 16.1909122467041, 22.799161911010742, 29.40741539001465, 36.015663146972656, 42.62391662597656, 49.2321662902832, 55.840415954589844, 62.44866943359375, 69.05691528320312, 75.66516876220703, 82.27342224121094, 88.88166809082031, 95.48992156982422, 102.09817504882812, 108.7064208984375, 115.3146743774414, 121.92292785644531, 128.5311737060547, 135.13943481445312, 141.7476806640625, 148.35592651367188, 154.96417236328125, 161.5724334716797, 168.18067932128906, 174.78892517089844, 181.39718627929688, 188.00543212890625, 194.61367797851562, 201.221923828125, 207.83016967773438, 214.4384307861328, 221.0466766357422, 227.65492248535156, 234.26318359375, 240.87142944335938, 247.47967529296875, 254.08792114257812, 260.6961669921875, 267.3044128417969, 273.91265869140625, 280.52093505859375, 287.1291809082031, 293.7374267578125, 300.3456726074219, 306.95391845703125, 313.5621643066406, 320.17041015625, 326.7786865234375, 333.3869323730469, 339.99517822265625, 346.6034240722656, 353.211669921875, 359.8199462890625, 366.4281921386719, 373.03643798828125, 379.64471435546875, 386.2529602050781, 392.8612060546875, 399.4694519042969, 406.07769775390625, 412.6859436035156]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 9.0, 5.0, 11.0, 7.0, 18.0, 17.0, 21.0, 22.0, 20.0, 17.0, 25.0, 36.0, 38.0, 27.0, 37.0, 45.0, 43.0, 28.0, 37.0, 43.0, 47.0, 35.0, 35.0, 28.0, 36.0, 44.0, 39.0, 31.0, 26.0, 26.0, 24.0, 17.0, 22.0, 15.0, 13.0, 7.0, 10.0, 5.0, 9.0, 5.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-51.54712677001953, -50.032745361328125, -48.51836013793945, -47.00397872924805, -45.489593505859375, -43.97521209716797, -42.46083068847656, -40.94644546508789, -39.43206024169922, -37.91767883300781, -36.40329360961914, -34.888912200927734, -33.37452697753906, -31.860145568847656, -30.345762252807617, -28.831378936767578, -27.316997528076172, -25.802614212036133, -24.288230895996094, -22.773849487304688, -21.259464263916016, -19.74508285522461, -18.23069953918457, -16.71631622314453, -15.201932907104492, -13.687549591064453, -12.173166275024414, -10.658783912658691, -9.144400596618652, -7.630017280578613, -6.115634918212891, -4.601251602172852, -3.0868682861328125, -1.5724852085113525, -0.05810213088989258, 1.4562807083129883, 2.9706640243530273, 4.485047340393066, 5.999429702758789, 7.513813018798828, 9.028196334838867, 10.542579650878906, 12.056962966918945, 13.571345329284668, 15.085728645324707, 16.600112915039062, 18.11449432373047, 19.628877639770508, 21.143260955810547, 22.657644271850586, 24.172027587890625, 25.68640899658203, 27.200794219970703, 28.71517562866211, 30.22955894470215, 31.743942260742188, 33.258323669433594, 34.772705078125, 36.28709030151367, 37.80147171020508, 39.31585693359375, 40.830238342285156, 42.34461975097656, 43.859004974365234, 45.373390197753906]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 8.0, 8.0, 7.0, 8.0, 12.0, 21.0, 24.0, 18.0, 25.0, 27.0, 34.0, 40.0, 39.0, 33.0, 39.0, 53.0, 41.0, 43.0, 34.0, 40.0, 36.0, 37.0, 42.0, 27.0, 46.0, 29.0, 27.0, 20.0, 33.0, 25.0, 19.0, 20.0, 16.0, 12.0, 7.0, 8.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.9609375, -5.78814697265625, -5.6153564453125, -5.44256591796875, -5.269775390625, -5.09698486328125, -4.9241943359375, -4.75140380859375, -4.57861328125, -4.40582275390625, -4.2330322265625, -4.06024169921875, -3.887451171875, -3.71466064453125, -3.5418701171875, -3.36907958984375, -3.1962890625, -3.02349853515625, -2.8507080078125, -2.67791748046875, -2.505126953125, -2.33233642578125, -2.1595458984375, -1.98675537109375, -1.81396484375, -1.64117431640625, -1.4683837890625, -1.29559326171875, -1.122802734375, -0.95001220703125, -0.7772216796875, -0.60443115234375, -0.431640625, -0.25885009765625, -0.0860595703125, 0.08673095703125, 0.259521484375, 0.43231201171875, 0.6051025390625, 0.77789306640625, 0.95068359375, 1.12347412109375, 1.2962646484375, 1.46905517578125, 1.641845703125, 1.81463623046875, 1.9874267578125, 2.16021728515625, 2.3330078125, 2.50579833984375, 2.6785888671875, 2.85137939453125, 3.024169921875, 3.19696044921875, 3.3697509765625, 3.54254150390625, 3.71533203125, 3.88812255859375, 4.0609130859375, 4.23370361328125, 4.406494140625, 4.57928466796875, 4.7520751953125, 4.92486572265625, 5.09765625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 8.0, 11.0, 16.0, 21.0, 13.0, 21.0, 29.0, 29.0, 45.0, 52.0, 67.0, 96.0, 159.0, 369.0, 2157.0, 26198.0, 1786726.0, 2340829.0, 34047.0, 2370.0, 402.0, 133.0, 107.0, 72.0, 50.0, 46.0, 26.0, 26.0, 28.0, 16.0, 19.0, 14.0, 11.0, 10.0, 8.0, 8.0, 3.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-30.796875, -29.9423828125, -29.087890625, -28.2333984375, -27.37890625, -26.5244140625, -25.669921875, -24.8154296875, -23.9609375, -23.1064453125, -22.251953125, -21.3974609375, -20.54296875, -19.6884765625, -18.833984375, -17.9794921875, -17.125, -16.2705078125, -15.416015625, -14.5615234375, -13.70703125, -12.8525390625, -11.998046875, -11.1435546875, -10.2890625, -9.4345703125, -8.580078125, -7.7255859375, -6.87109375, -6.0166015625, -5.162109375, -4.3076171875, -3.453125, -2.5986328125, -1.744140625, -0.8896484375, -0.03515625, 0.8193359375, 1.673828125, 2.5283203125, 3.3828125, 4.2373046875, 5.091796875, 5.9462890625, 6.80078125, 7.6552734375, 8.509765625, 9.3642578125, 10.21875, 11.0732421875, 11.927734375, 12.7822265625, 13.63671875, 14.4912109375, 15.345703125, 16.2001953125, 17.0546875, 17.9091796875, 18.763671875, 19.6181640625, 20.47265625, 21.3271484375, 22.181640625, 23.0361328125, 23.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 4.0, 12.0, 8.0, 18.0, 23.0, 37.0, 42.0, 54.0, 91.0, 134.0, 161.0, 226.0, 327.0, 405.0, 513.0, 489.0, 427.0, 330.0, 229.0, 155.0, 131.0, 82.0, 59.0, 28.0, 31.0, 14.0, 11.0, 10.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.924072265625, -11.49658203125, -11.069091796875, -10.6416015625, -10.214111328125, -9.78662109375, -9.359130859375, -8.931640625, -8.504150390625, -8.07666015625, -7.649169921875, -7.2216796875, -6.794189453125, -6.36669921875, -5.939208984375, -5.51171875, -5.084228515625, -4.65673828125, -4.229248046875, -3.8017578125, -3.374267578125, -2.94677734375, -2.519287109375, -2.091796875, -1.664306640625, -1.23681640625, -0.809326171875, -0.3818359375, 0.045654296875, 0.47314453125, 0.900634765625, 1.328125, 1.755615234375, 2.18310546875, 2.610595703125, 3.0380859375, 3.465576171875, 3.89306640625, 4.320556640625, 4.748046875, 5.175537109375, 5.60302734375, 6.030517578125, 6.4580078125, 6.885498046875, 7.31298828125, 7.740478515625, 8.16796875, 8.595458984375, 9.02294921875, 9.450439453125, 9.8779296875, 10.305419921875, 10.73291015625, 11.160400390625, 11.587890625, 12.015380859375, 12.44287109375, 12.870361328125, 13.2978515625, 13.725341796875, 14.15283203125, 14.580322265625, 15.0078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 12.0, 13.0, 12.0, 21.0, 31.0, 42.0, 54.0, 62.0, 98.0, 139.0, 186.0, 296.0, 547.0, 1692.0, 21048.0, 1729504.0, 2410485.0, 26489.0, 1977.0, 526.0, 315.0, 188.0, 132.0, 104.0, 83.0, 56.0, 45.0, 18.0, 26.0, 16.0, 20.0, 6.0, 8.0, 11.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.53125, -41.20361328125, -39.8759765625, -38.54833984375, -37.220703125, -35.89306640625, -34.5654296875, -33.23779296875, -31.91015625, -30.58251953125, -29.2548828125, -27.92724609375, -26.599609375, -25.27197265625, -23.9443359375, -22.61669921875, -21.2890625, -19.96142578125, -18.6337890625, -17.30615234375, -15.978515625, -14.65087890625, -13.3232421875, -11.99560546875, -10.66796875, -9.34033203125, -8.0126953125, -6.68505859375, -5.357421875, -4.02978515625, -2.7021484375, -1.37451171875, -0.046875, 1.28076171875, 2.6083984375, 3.93603515625, 5.263671875, 6.59130859375, 7.9189453125, 9.24658203125, 10.57421875, 11.90185546875, 13.2294921875, 14.55712890625, 15.884765625, 17.21240234375, 18.5400390625, 19.86767578125, 21.1953125, 22.52294921875, 23.8505859375, 25.17822265625, 26.505859375, 27.83349609375, 29.1611328125, 30.48876953125, 31.81640625, 33.14404296875, 34.4716796875, 35.79931640625, 37.126953125, 38.45458984375, 39.7822265625, 41.10986328125, 42.4375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 13.0, 26.0, 67.0, 90.0, 142.0, 225.0, 167.0, 140.0, 71.0, 45.0, 17.0, 8.0, 1.0, 3.0], "bins": [-175.13687133789062, -171.99627685546875, -168.85569763183594, -165.71511840820312, -162.57452392578125, -159.43392944335938, -156.29335021972656, -153.15277099609375, -150.01217651367188, -146.87158203125, -143.7310028076172, -140.59042358398438, -137.4498291015625, -134.30923461914062, -131.1686553955078, -128.028076171875, -124.88748168945312, -121.74689483642578, -118.60630798339844, -115.4657211303711, -112.32513427734375, -109.1845474243164, -106.04396057128906, -102.90337371826172, -99.76278686523438, -96.62220001220703, -93.48161315917969, -90.34102630615234, -87.200439453125, -84.05985260009766, -80.91926574707031, -77.77867889404297, -74.63809204101562, -71.49750518798828, -68.35691833496094, -65.2163314819336, -62.07574462890625, -58.935157775878906, -55.79457092285156, -52.65398406982422, -49.513397216796875, -46.37281036376953, -43.23222351074219, -40.091636657714844, -36.9510498046875, -33.810462951660156, -30.669876098632812, -27.52928924560547, -24.388702392578125, -21.24811553955078, -18.107528686523438, -14.966941833496094, -11.82635498046875, -8.685768127441406, -5.5451812744140625, -2.4045944213867188, 0.735992431640625, 3.8765792846679688, 7.0171661376953125, 10.157752990722656, 13.29833984375, 16.438926696777344, 19.579513549804688, 22.72010040283203, 25.860687255859375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 9.0, 10.0, 1.0, 12.0, 15.0, 6.0, 11.0, 10.0, 18.0, 21.0, 25.0, 21.0, 29.0, 28.0, 27.0, 26.0, 25.0, 37.0, 51.0, 31.0, 43.0, 27.0, 50.0, 39.0, 37.0, 36.0, 36.0, 34.0, 35.0, 28.0, 27.0, 30.0, 21.0, 18.0, 24.0, 24.0, 19.0, 15.0, 11.0, 5.0, 4.0, 5.0, 8.0, 2.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.52217102050781, -34.38365936279297, -33.245147705078125, -32.10663604736328, -30.968124389648438, -29.829612731933594, -28.691099166870117, -27.552587509155273, -26.41407585144043, -25.275564193725586, -24.137052536010742, -22.9985408782959, -21.860027313232422, -20.721515655517578, -19.583003997802734, -18.44449234008789, -17.305980682373047, -16.167469024658203, -15.02895736694336, -13.8904447555542, -12.751933097839355, -11.613421440124512, -10.474908828735352, -9.336397171020508, -8.197885513305664, -7.05937385559082, -5.920861721038818, -4.782349586486816, -3.6438379287719727, -2.505326271057129, -1.366814136505127, -0.228302001953125, 0.9102096557617188, 2.0487215518951416, 3.1872334480285645, 4.325745582580566, 5.46425724029541, 6.602768898010254, 7.741281032562256, 8.879793167114258, 10.018304824829102, 11.156816482543945, 12.295328140258789, 13.43384075164795, 14.572352409362793, 15.710864067077637, 16.849376678466797, 17.98788833618164, 19.126399993896484, 20.264911651611328, 21.403423309326172, 22.541934967041016, 23.68044662475586, 24.818958282470703, 25.95747184753418, 27.095983505249023, 28.234495162963867, 29.37300682067871, 30.511518478393555, 31.6500301361084, 32.788543701171875, 33.92705535888672, 35.06556701660156, 36.204078674316406, 37.34259033203125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 33.0, 45.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 9.0, 5.0, 17.0, 39.0, 34.0, 78.0, 118.0, 198.0, 333.0, 597.0, 936.0, 1558.0, 2614.0, 4113.0, 7081.0, 11535.0, 19185.0, 33461.0, 57909.0, 100157.0, 161772.0, 208330.0, 173416.0, 110378.0, 64576.0, 36757.0, 21404.0, 12731.0, 7497.0, 4664.0, 2830.0, 1668.0, 984.0, 656.0, 358.0, 213.0, 138.0, 69.0, 59.0, 37.0, 19.0, 12.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6212921142578125, -0.600982666015625, -0.5806732177734375, -0.56036376953125, -0.5400543212890625, -0.519744873046875, -0.4994354248046875, -0.4791259765625, -0.4588165283203125, -0.438507080078125, -0.4181976318359375, -0.39788818359375, -0.3775787353515625, -0.357269287109375, -0.3369598388671875, -0.316650390625, -0.2963409423828125, -0.276031494140625, -0.2557220458984375, -0.23541259765625, -0.2151031494140625, -0.194793701171875, -0.1744842529296875, -0.1541748046875, -0.1338653564453125, -0.113555908203125, -0.0932464599609375, -0.07293701171875, -0.0526275634765625, -0.032318115234375, -0.0120086669921875, 0.00830078125, 0.0286102294921875, 0.048919677734375, 0.0692291259765625, 0.08953857421875, 0.1098480224609375, 0.130157470703125, 0.1504669189453125, 0.1707763671875, 0.1910858154296875, 0.211395263671875, 0.2317047119140625, 0.25201416015625, 0.2723236083984375, 0.292633056640625, 0.3129425048828125, 0.333251953125, 0.3535614013671875, 0.373870849609375, 0.3941802978515625, 0.41448974609375, 0.4347991943359375, 0.455108642578125, 0.4754180908203125, 0.4957275390625, 0.5160369873046875, 0.536346435546875, 0.5566558837890625, 0.57696533203125, 0.5972747802734375, 0.617584228515625, 0.6378936767578125, 0.658203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 1.0, 6.0, 4.0, 6.0, 8.0, 4.0, 8.0, 12.0, 23.0, 15.0, 18.0, 18.0, 27.0, 25.0, 32.0, 17.0, 38.0, 36.0, 34.0, 32.0, 42.0, 23.0, 39.0, 1063.0, 38.0, 29.0, 51.0, 34.0, 35.0, 33.0, 31.0, 31.0, 30.0, 26.0, 24.0, 28.0, 8.0, 14.0, 16.0, 12.0, 12.0, 4.0, 13.0, 8.0, 6.0, 4.0, 1.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3671875, -3.26776123046875, -3.1683349609375, -3.06890869140625, -2.969482421875, -2.87005615234375, -2.7706298828125, -2.67120361328125, -2.57177734375, -2.47235107421875, -2.3729248046875, -2.27349853515625, -2.174072265625, -2.07464599609375, -1.9752197265625, -1.87579345703125, -1.7763671875, -1.67694091796875, -1.5775146484375, -1.47808837890625, -1.378662109375, -1.27923583984375, -1.1798095703125, -1.08038330078125, -0.98095703125, -0.88153076171875, -0.7821044921875, -0.68267822265625, -0.583251953125, -0.48382568359375, -0.3843994140625, -0.28497314453125, -0.185546875, -0.08612060546875, 0.0133056640625, 0.11273193359375, 0.212158203125, 0.31158447265625, 0.4110107421875, 0.51043701171875, 0.60986328125, 0.70928955078125, 0.8087158203125, 0.90814208984375, 1.007568359375, 1.10699462890625, 1.2064208984375, 1.30584716796875, 1.4052734375, 1.50469970703125, 1.6041259765625, 1.70355224609375, 1.802978515625, 1.90240478515625, 2.0018310546875, 2.10125732421875, 2.20068359375, 2.30010986328125, 2.3995361328125, 2.49896240234375, 2.598388671875, 2.69781494140625, 2.7972412109375, 2.89666748046875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 8.0, 2.0, 8.0, 13.0, 19.0, 34.0, 40.0, 67.0, 112.0, 182.0, 332.0, 508.0, 807.0, 1373.0, 2168.0, 3775.0, 5909.0, 9830.0, 16190.0, 26735.0, 43580.0, 70906.0, 110714.0, 155703.0, 1224796.0, 149971.0, 103778.0, 65905.0, 40903.0, 24510.0, 14910.0, 8999.0, 5554.0, 3455.0, 2085.0, 1244.0, 755.0, 479.0, 289.0, 182.0, 114.0, 72.0, 44.0, 27.0, 15.0, 12.0, 9.0, 4.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4067955017089844, -0.39342498779296875, -0.3800544738769531, -0.3666839599609375, -0.3533134460449219, -0.33994293212890625, -0.3265724182128906, -0.313201904296875, -0.2998313903808594, -0.28646087646484375, -0.2730903625488281, -0.2597198486328125, -0.24634933471679688, -0.23297882080078125, -0.21960830688476562, -0.20623779296875, -0.19286727905273438, -0.17949676513671875, -0.16612625122070312, -0.1527557373046875, -0.13938522338867188, -0.12601470947265625, -0.11264419555664062, -0.099273681640625, -0.08590316772460938, -0.07253265380859375, -0.059162139892578125, -0.0457916259765625, -0.032421112060546875, -0.01905059814453125, -0.005680084228515625, 0.0076904296875, 0.021060943603515625, 0.03443145751953125, 0.047801971435546875, 0.0611724853515625, 0.07454299926757812, 0.08791351318359375, 0.10128402709960938, 0.114654541015625, 0.12802505493164062, 0.14139556884765625, 0.15476608276367188, 0.1681365966796875, 0.18150711059570312, 0.19487762451171875, 0.20824813842773438, 0.22161865234375, 0.23498916625976562, 0.24835968017578125, 0.2617301940917969, 0.2751007080078125, 0.2884712219238281, 0.30184173583984375, 0.3152122497558594, 0.328582763671875, 0.3419532775878906, 0.35532379150390625, 0.3686943054199219, 0.3820648193359375, 0.3954353332519531, 0.40880584716796875, 0.4221763610839844, 0.435546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 10.0, 11.0, 12.0, 19.0, 24.0, 29.0, 28.0, 46.0, 47.0, 50.0, 52.0, 64.0, 86.0, 74.0, 67.0, 52.0, 56.0, 35.0, 31.0, 25.0, 24.0, 27.0, 15.0, 15.0, 12.0, 7.0, 7.0, 5.0, 4.0, 6.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.005229949951171875, -0.005082249641418457, -0.004934549331665039, -0.004786849021911621, -0.004639148712158203, -0.004491448402404785, -0.004343748092651367, -0.004196047782897949, -0.004048347473144531, -0.0039006471633911133, -0.0037529468536376953, -0.0036052465438842773, -0.0034575462341308594, -0.0033098459243774414, -0.0031621456146240234, -0.0030144453048706055, -0.0028667449951171875, -0.0027190446853637695, -0.0025713443756103516, -0.0024236440658569336, -0.0022759437561035156, -0.0021282434463500977, -0.0019805431365966797, -0.0018328428268432617, -0.0016851425170898438, -0.0015374422073364258, -0.0013897418975830078, -0.0012420415878295898, -0.0010943412780761719, -0.0009466409683227539, -0.0007989406585693359, -0.000651240348815918, -0.0005035400390625, -0.00035583972930908203, -0.00020813941955566406, -6.0439109802246094e-05, 8.726119995117188e-05, 0.00023496150970458984, 0.0003826618194580078, 0.0005303621292114258, 0.0006780624389648438, 0.0008257627487182617, 0.0009734630584716797, 0.0011211633682250977, 0.0012688636779785156, 0.0014165639877319336, 0.0015642642974853516, 0.0017119646072387695, 0.0018596649169921875, 0.0020073652267456055, 0.0021550655364990234, 0.0023027658462524414, 0.0024504661560058594, 0.0025981664657592773, 0.0027458667755126953, 0.0028935670852661133, 0.0030412673950195312, 0.0031889677047729492, 0.003336668014526367, 0.003484368324279785, 0.003632068634033203, 0.003779768943786621, 0.003927469253540039, 0.004075169563293457, 0.004222869873046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 2.0, 6.0, 10.0, 6.0, 3.0, 4.0, 11.0, 21.0, 29.0, 38.0, 55.0, 63.0, 71.0, 105.0, 182.0, 289.0, 599.0, 4284.0, 990878.0, 49860.0, 895.0, 413.0, 225.0, 143.0, 99.0, 70.0, 49.0, 35.0, 18.0, 18.0, 14.0, 4.0, 6.0, 6.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08699798583984375, -0.0839691162109375, -0.08094024658203125, -0.077911376953125, -0.07488250732421875, -0.0718536376953125, -0.06882476806640625, -0.0657958984375, -0.06276702880859375, -0.0597381591796875, -0.05670928955078125, -0.053680419921875, -0.05065155029296875, -0.0476226806640625, -0.04459381103515625, -0.04156494140625, -0.03853607177734375, -0.0355072021484375, -0.03247833251953125, -0.029449462890625, -0.02642059326171875, -0.0233917236328125, -0.02036285400390625, -0.017333984375, -0.01430511474609375, -0.0112762451171875, -0.00824737548828125, -0.005218505859375, -0.00218963623046875, 0.0008392333984375, 0.00386810302734375, 0.00689697265625, 0.00992584228515625, 0.0129547119140625, 0.01598358154296875, 0.019012451171875, 0.02204132080078125, 0.0250701904296875, 0.02809906005859375, 0.0311279296875, 0.03415679931640625, 0.0371856689453125, 0.04021453857421875, 0.043243408203125, 0.04627227783203125, 0.0493011474609375, 0.05233001708984375, 0.05535888671875, 0.05838775634765625, 0.0614166259765625, 0.06444549560546875, 0.067474365234375, 0.07050323486328125, 0.0735321044921875, 0.07656097412109375, 0.07958984375, 0.08261871337890625, 0.0856475830078125, 0.08867645263671875, 0.091705322265625, 0.09473419189453125, 0.0977630615234375, 0.10079193115234375, 0.10382080078125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 165.0, 762.0, 71.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00869666412472725, -0.007854385301470757, -0.007012106012552977, -0.006169827189296484, -0.005327547900378704, -0.0044852690771222115, -0.003642990253865719, -0.002800710964947939, -0.0019584321416914463, -0.00111615308560431, -0.0002738741459324956, 0.0005684047937393188, 0.0014106838498264551, 0.0022529629059135914, 0.003095241729170084, 0.003937521018087864, 0.0047797998413443565, 0.005622078664600849, 0.006464357953518629, 0.007306636776775122, 0.008148916065692902, 0.008991194888949394, 0.009833473712205887, 0.01067575253546238, 0.011518031358718872, 0.012360310181975365, 0.013202589005231857, 0.01404486782848835, 0.014887147583067417, 0.015729427337646484, 0.016571704298257828, 0.01741398498415947, 0.018256263807415962, 0.019098542630672455, 0.019940821453928947, 0.02078310027718544, 0.021625379100441933, 0.022467657923698425, 0.023309938609600067, 0.02415221743285656, 0.024994496256113052, 0.025836775079369545, 0.026679053902626038, 0.02752133272588253, 0.028363611549139023, 0.029205892235040665, 0.030048169195652008, 0.03089044988155365, 0.03173272684216499, 0.032575007528066635, 0.03341728448867798, 0.03425956517457962, 0.035101842135190964, 0.035944122821092606, 0.03678639978170395, 0.03762868046760559, 0.03847096115350723, 0.039313241839408875, 0.04015551880002022, 0.04099779948592186, 0.0418400764465332, 0.042682357132434845, 0.04352463409304619, 0.04436691477894783, 0.045209191739559174]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 15.0, 23.0, 19.0, 32.0, 42.0, 43.0, 42.0, 53.0, 51.0, 64.0, 52.0, 47.0, 51.0, 56.0, 64.0, 36.0, 55.0, 41.0, 38.0, 25.0, 34.0, 21.0, 18.0, 12.0, 13.0, 7.0, 8.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004752993583679199, -0.004619834013283253, -0.004486674442887306, -0.00435351487249136, -0.004220355302095413, -0.004087195731699467, -0.00395403616130352, -0.0038208765909075737, -0.003687717020511627, -0.0035545574501156807, -0.003421397879719734, -0.0032882383093237877, -0.003155078738927841, -0.0030219191685318947, -0.002888759598135948, -0.0027556000277400017, -0.002622440457344055, -0.0024892808869481087, -0.002356121316552162, -0.0022229617461562157, -0.002089802175760269, -0.0019566426053643227, -0.0018234830349683762, -0.0016903234645724297, -0.0015571638941764832, -0.0014240043237805367, -0.0012908447533845901, -0.0011576851829886436, -0.0010245256125926971, -0.0008913660421967506, -0.0007582064718008041, -0.0006250469014048576, -0.0004918873310089111, -0.00035872776061296463, -0.00022556819021701813, -9.240861982107162e-05, 4.075095057487488e-05, 0.00017391052097082138, 0.0003070700913667679, 0.0004402296617627144, 0.0005733892321586609, 0.0007065488025546074, 0.0008397083729505539, 0.0009728679433465004, 0.001106027513742447, 0.0012391870841383934, 0.00137234665453434, 0.0015055062249302864, 0.001638665795326233, 0.0017718253657221794, 0.001904984936118126, 0.0020381445065140724, 0.002171304076910019, 0.0023044636473059654, 0.002437623217701912, 0.0025707827880978584, 0.002703942358493805, 0.0028371019288897514, 0.002970261499285698, 0.0031034210696816444, 0.003236580640077591, 0.0033697402104735374, 0.003502899780869484, 0.0036360593512654305, 0.003769218921661377]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 9.0, 9.0, 11.0, 13.0, 11.0, 16.0, 17.0, 18.0, 27.0, 25.0, 35.0, 26.0, 29.0, 40.0, 23.0, 40.0, 34.0, 32.0, 35.0, 43.0, 34.0, 44.0, 24.0, 29.0, 36.0, 31.0, 43.0, 32.0, 18.0, 25.0, 20.0, 18.0, 25.0, 20.0, 12.0, 11.0, 13.0, 10.0, 9.0, 12.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-4.82421875, -4.66900634765625, -4.5137939453125, -4.35858154296875, -4.203369140625, -4.04815673828125, -3.8929443359375, -3.73773193359375, -3.58251953125, -3.42730712890625, -3.2720947265625, -3.11688232421875, -2.961669921875, -2.80645751953125, -2.6512451171875, -2.49603271484375, -2.3408203125, -2.18560791015625, -2.0303955078125, -1.87518310546875, -1.719970703125, -1.56475830078125, -1.4095458984375, -1.25433349609375, -1.09912109375, -0.94390869140625, -0.7886962890625, -0.63348388671875, -0.478271484375, -0.32305908203125, -0.1678466796875, -0.01263427734375, 0.142578125, 0.29779052734375, 0.4530029296875, 0.60821533203125, 0.763427734375, 0.91864013671875, 1.0738525390625, 1.22906494140625, 1.38427734375, 1.53948974609375, 1.6947021484375, 1.84991455078125, 2.005126953125, 2.16033935546875, 2.3155517578125, 2.47076416015625, 2.6259765625, 2.78118896484375, 2.9364013671875, 3.09161376953125, 3.246826171875, 3.40203857421875, 3.5572509765625, 3.71246337890625, 3.86767578125, 4.02288818359375, 4.1781005859375, 4.33331298828125, 4.488525390625, 4.64373779296875, 4.7989501953125, 4.95416259765625, 5.109375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 9.0, 3.0, 2.0, 9.0, 11.0, 21.0, 37.0, 38.0, 54.0, 104.0, 178.0, 280.0, 424.0, 625.0, 1100.0, 1748.0, 2775.0, 4643.0, 8018.0, 13800.0, 25276.0, 52256.0, 147238.0, 443603.0, 209615.0, 66886.0, 30397.0, 16296.0, 9358.0, 5364.0, 3232.0, 1940.0, 1187.0, 749.0, 435.0, 314.0, 188.0, 127.0, 69.0, 48.0, 37.0, 29.0, 23.0, 13.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.4669189453125, -3.353759765625, -3.2406005859375, -3.12744140625, -3.0142822265625, -2.901123046875, -2.7879638671875, -2.6748046875, -2.5616455078125, -2.448486328125, -2.3353271484375, -2.22216796875, -2.1090087890625, -1.995849609375, -1.8826904296875, -1.76953125, -1.6563720703125, -1.543212890625, -1.4300537109375, -1.31689453125, -1.2037353515625, -1.090576171875, -0.9774169921875, -0.8642578125, -0.7510986328125, -0.637939453125, -0.5247802734375, -0.41162109375, -0.2984619140625, -0.185302734375, -0.0721435546875, 0.041015625, 0.1541748046875, 0.267333984375, 0.3804931640625, 0.49365234375, 0.6068115234375, 0.719970703125, 0.8331298828125, 0.9462890625, 1.0594482421875, 1.172607421875, 1.2857666015625, 1.39892578125, 1.5120849609375, 1.625244140625, 1.7384033203125, 1.8515625, 1.9647216796875, 2.077880859375, 2.1910400390625, 2.30419921875, 2.4173583984375, 2.530517578125, 2.6436767578125, 2.7568359375, 2.8699951171875, 2.983154296875, 3.0963134765625, 3.20947265625, 3.3226318359375, 3.435791015625, 3.5489501953125, 3.662109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 19.0, 12.0, 18.0, 29.0, 29.0, 32.0, 29.0, 33.0, 49.0, 46.0, 64.0, 129.0, 1681.0, 304.0, 95.0, 58.0, 40.0, 46.0, 46.0, 32.0, 34.0, 29.0, 24.0, 31.0, 19.0, 17.0, 9.0, 16.0, 8.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.674560546875, -16.98974609375, -16.304931640625, -15.6201171875, -14.935302734375, -14.25048828125, -13.565673828125, -12.880859375, -12.196044921875, -11.51123046875, -10.826416015625, -10.1416015625, -9.456787109375, -8.77197265625, -8.087158203125, -7.40234375, -6.717529296875, -6.03271484375, -5.347900390625, -4.6630859375, -3.978271484375, -3.29345703125, -2.608642578125, -1.923828125, -1.239013671875, -0.55419921875, 0.130615234375, 0.8154296875, 1.500244140625, 2.18505859375, 2.869873046875, 3.5546875, 4.239501953125, 4.92431640625, 5.609130859375, 6.2939453125, 6.978759765625, 7.66357421875, 8.348388671875, 9.033203125, 9.718017578125, 10.40283203125, 11.087646484375, 11.7724609375, 12.457275390625, 13.14208984375, 13.826904296875, 14.51171875, 15.196533203125, 15.88134765625, 16.566162109375, 17.2509765625, 17.935791015625, 18.62060546875, 19.305419921875, 19.990234375, 20.675048828125, 21.35986328125, 22.044677734375, 22.7294921875, 23.414306640625, 24.09912109375, 24.783935546875, 25.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 12.0, 17.0, 18.0, 26.0, 43.0, 49.0, 63.0, 87.0, 108.0, 218.0, 401.0, 1089.0, 19032.0, 3106433.0, 16107.0, 973.0, 377.0, 210.0, 120.0, 85.0, 49.0, 37.0, 32.0, 23.0, 19.0, 18.0, 13.0, 9.0, 6.0, 1.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.1875, -65.39501953125, -63.6025390625, -61.81005859375, -60.017578125, -58.22509765625, -56.4326171875, -54.64013671875, -52.84765625, -51.05517578125, -49.2626953125, -47.47021484375, -45.677734375, -43.88525390625, -42.0927734375, -40.30029296875, -38.5078125, -36.71533203125, -34.9228515625, -33.13037109375, -31.337890625, -29.54541015625, -27.7529296875, -25.96044921875, -24.16796875, -22.37548828125, -20.5830078125, -18.79052734375, -16.998046875, -15.20556640625, -13.4130859375, -11.62060546875, -9.828125, -8.03564453125, -6.2431640625, -4.45068359375, -2.658203125, -0.86572265625, 0.9267578125, 2.71923828125, 4.51171875, 6.30419921875, 8.0966796875, 9.88916015625, 11.681640625, 13.47412109375, 15.2666015625, 17.05908203125, 18.8515625, 20.64404296875, 22.4365234375, 24.22900390625, 26.021484375, 27.81396484375, 29.6064453125, 31.39892578125, 33.19140625, 34.98388671875, 36.7763671875, 38.56884765625, 40.361328125, 42.15380859375, 43.9462890625, 45.73876953125, 47.53125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 14.0, 35.0, 59.0, 101.0, 152.0, 187.0, 168.0, 145.0, 75.0, 40.0, 22.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.403079986572266, -46.38817596435547, -45.373268127441406, -44.35836410522461, -43.34346008300781, -42.32855224609375, -41.31364822387695, -40.298744201660156, -39.283836364746094, -38.2689323425293, -37.254024505615234, -36.23912048339844, -35.22421646118164, -34.209312438964844, -33.19440460205078, -32.179500579833984, -31.164596557617188, -30.149690628051758, -29.13478660583496, -28.11988067626953, -27.104976654052734, -26.090070724487305, -25.075164794921875, -24.060260772705078, -23.04535484313965, -22.03044891357422, -21.015544891357422, -20.000638961791992, -18.985733032226562, -17.970829010009766, -16.955923080444336, -15.941018104553223, -14.926109313964844, -13.91120433807373, -12.896299362182617, -11.881393432617188, -10.866488456726074, -9.851583480834961, -8.836677551269531, -7.821772575378418, -6.806867599487305, -5.791962623596191, -4.77705717086792, -3.7621519565582275, -2.747246742248535, -1.7323417663574219, -0.7174363136291504, 0.2974691390991211, 1.3123741149902344, 2.3272793292999268, 3.342184543609619, 4.357089996337891, 5.371994972229004, 6.386899948120117, 7.401805400848389, 8.41671085357666, 9.431615829467773, 10.446520805358887, 11.46142578125, 12.47633171081543, 13.491236686706543, 14.506141662597656, 15.521047592163086, 16.535953521728516, 17.550857543945312]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 4.0, 11.0, 6.0, 18.0, 15.0, 16.0, 24.0, 20.0, 25.0, 25.0, 25.0, 34.0, 40.0, 35.0, 35.0, 45.0, 24.0, 46.0, 43.0, 40.0, 36.0, 55.0, 29.0, 47.0, 35.0, 34.0, 27.0, 27.0, 21.0, 32.0, 16.0, 17.0, 8.0, 17.0, 15.0, 9.0, 6.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.996826171875, -48.29018783569336, -46.58354568481445, -44.87690734863281, -43.170265197753906, -41.463626861572266, -39.756988525390625, -38.05034637451172, -36.34370803833008, -34.63706970214844, -32.93042755126953, -31.22378921508789, -29.517148971557617, -27.810508728027344, -26.10386848449707, -24.397228240966797, -22.690587997436523, -20.98394775390625, -19.277307510375977, -17.570667266845703, -15.864028930664062, -14.157388687133789, -12.450748443603516, -10.744109153747559, -9.037468910217285, -7.33082914352417, -5.624189376831055, -3.9175491333007812, -2.210909366607666, -0.5042695999145508, 1.2023706436157227, 2.9090099334716797, 4.615650177001953, 6.322289943695068, 8.028929710388184, 9.735569953918457, 11.442209243774414, 13.148849487304688, 14.855489730834961, 16.562129974365234, 18.268768310546875, 19.97540855407715, 21.682048797607422, 23.388687133789062, 25.095327377319336, 26.80196762084961, 28.508607864379883, 30.215248107910156, 31.92188835144043, 33.6285285949707, 35.335166931152344, 37.04180908203125, 38.74844741821289, 40.45508575439453, 42.16172790527344, 43.86836624145508, 45.575008392333984, 47.281646728515625, 48.98828887939453, 50.69492721557617, 52.40156936645508, 54.10820770263672, 55.814849853515625, 57.521488189697266, 59.228126525878906]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 10.0, 7.0, 8.0, 11.0, 16.0, 9.0, 15.0, 20.0, 26.0, 41.0, 30.0, 34.0, 33.0, 26.0, 23.0, 32.0, 35.0, 33.0, 49.0, 39.0, 39.0, 38.0, 27.0, 36.0, 32.0, 32.0, 35.0, 26.0, 28.0, 23.0, 20.0, 25.0, 18.0, 9.0, 19.0, 13.0, 14.0, 8.0, 10.0, 7.0, 6.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.7607421875, -4.595703125, -4.4306640625, -4.265625, -4.1005859375, -3.935546875, -3.7705078125, -3.60546875, -3.4404296875, -3.275390625, -3.1103515625, -2.9453125, -2.7802734375, -2.615234375, -2.4501953125, -2.28515625, -2.1201171875, -1.955078125, -1.7900390625, -1.625, -1.4599609375, -1.294921875, -1.1298828125, -0.96484375, -0.7998046875, -0.634765625, -0.4697265625, -0.3046875, -0.1396484375, 0.025390625, 0.1904296875, 0.35546875, 0.5205078125, 0.685546875, 0.8505859375, 1.015625, 1.1806640625, 1.345703125, 1.5107421875, 1.67578125, 1.8408203125, 2.005859375, 2.1708984375, 2.3359375, 2.5009765625, 2.666015625, 2.8310546875, 2.99609375, 3.1611328125, 3.326171875, 3.4912109375, 3.65625, 3.8212890625, 3.986328125, 4.1513671875, 4.31640625, 4.4814453125, 4.646484375, 4.8115234375, 4.9765625, 5.1416015625, 5.306640625, 5.4716796875, 5.63671875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 14.0, 14.0, 19.0, 31.0, 64.0, 59.0, 100.0, 154.0, 215.0, 326.0, 573.0, 1010.0, 1970.0, 4168.0, 10138.0, 30960.0, 128332.0, 675938.0, 1841519.0, 1180792.0, 241944.0, 49560.0, 14997.0, 5709.0, 2466.0, 1262.0, 699.0, 384.0, 255.0, 172.0, 120.0, 82.0, 47.0, 33.0, 29.0, 29.0, 23.0, 19.0, 13.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.171875, -8.891357421875, -8.61083984375, -8.330322265625, -8.0498046875, -7.769287109375, -7.48876953125, -7.208251953125, -6.927734375, -6.647216796875, -6.36669921875, -6.086181640625, -5.8056640625, -5.525146484375, -5.24462890625, -4.964111328125, -4.68359375, -4.403076171875, -4.12255859375, -3.842041015625, -3.5615234375, -3.281005859375, -3.00048828125, -2.719970703125, -2.439453125, -2.158935546875, -1.87841796875, -1.597900390625, -1.3173828125, -1.036865234375, -0.75634765625, -0.475830078125, -0.1953125, 0.085205078125, 0.36572265625, 0.646240234375, 0.9267578125, 1.207275390625, 1.48779296875, 1.768310546875, 2.048828125, 2.329345703125, 2.60986328125, 2.890380859375, 3.1708984375, 3.451416015625, 3.73193359375, 4.012451171875, 4.29296875, 4.573486328125, 4.85400390625, 5.134521484375, 5.4150390625, 5.695556640625, 5.97607421875, 6.256591796875, 6.537109375, 6.817626953125, 7.09814453125, 7.378662109375, 7.6591796875, 7.939697265625, 8.22021484375, 8.500732421875, 8.78125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 10.0, 20.0, 16.0, 18.0, 23.0, 23.0, 54.0, 60.0, 78.0, 106.0, 144.0, 200.0, 216.0, 338.0, 386.0, 412.0, 431.0, 328.0, 311.0, 188.0, 176.0, 128.0, 103.0, 66.0, 59.0, 28.0, 43.0, 30.0, 19.0, 11.0, 11.0, 11.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -9.979736328125, -9.60791015625, -9.236083984375, -8.8642578125, -8.492431640625, -8.12060546875, -7.748779296875, -7.376953125, -7.005126953125, -6.63330078125, -6.261474609375, -5.8896484375, -5.517822265625, -5.14599609375, -4.774169921875, -4.40234375, -4.030517578125, -3.65869140625, -3.286865234375, -2.9150390625, -2.543212890625, -2.17138671875, -1.799560546875, -1.427734375, -1.055908203125, -0.68408203125, -0.312255859375, 0.0595703125, 0.431396484375, 0.80322265625, 1.175048828125, 1.546875, 1.918701171875, 2.29052734375, 2.662353515625, 3.0341796875, 3.406005859375, 3.77783203125, 4.149658203125, 4.521484375, 4.893310546875, 5.26513671875, 5.636962890625, 6.0087890625, 6.380615234375, 6.75244140625, 7.124267578125, 7.49609375, 7.867919921875, 8.23974609375, 8.611572265625, 8.9833984375, 9.355224609375, 9.72705078125, 10.098876953125, 10.470703125, 10.842529296875, 11.21435546875, 11.586181640625, 11.9580078125, 12.329833984375, 12.70166015625, 13.073486328125, 13.4453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 2.0, 2.0, 12.0, 9.0, 6.0, 15.0, 18.0, 19.0, 23.0, 27.0, 47.0, 68.0, 71.0, 100.0, 146.0, 214.0, 393.0, 1128.0, 5364.0, 91694.0, 3452386.0, 621605.0, 17212.0, 2115.0, 573.0, 311.0, 182.0, 106.0, 102.0, 66.0, 69.0, 45.0, 34.0, 26.0, 18.0, 13.0, 10.0, 13.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-40.15625, -39.03271484375, -37.9091796875, -36.78564453125, -35.662109375, -34.53857421875, -33.4150390625, -32.29150390625, -31.16796875, -30.04443359375, -28.9208984375, -27.79736328125, -26.673828125, -25.55029296875, -24.4267578125, -23.30322265625, -22.1796875, -21.05615234375, -19.9326171875, -18.80908203125, -17.685546875, -16.56201171875, -15.4384765625, -14.31494140625, -13.19140625, -12.06787109375, -10.9443359375, -9.82080078125, -8.697265625, -7.57373046875, -6.4501953125, -5.32666015625, -4.203125, -3.07958984375, -1.9560546875, -0.83251953125, 0.291015625, 1.41455078125, 2.5380859375, 3.66162109375, 4.78515625, 5.90869140625, 7.0322265625, 8.15576171875, 9.279296875, 10.40283203125, 11.5263671875, 12.64990234375, 13.7734375, 14.89697265625, 16.0205078125, 17.14404296875, 18.267578125, 19.39111328125, 20.5146484375, 21.63818359375, 22.76171875, 23.88525390625, 25.0087890625, 26.13232421875, 27.255859375, 28.37939453125, 29.5029296875, 30.62646484375, 31.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 18.0, 25.0, 42.0, 107.0, 138.0, 162.0, 192.0, 132.0, 92.0, 50.0, 27.0, 15.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.44627380371094, -91.58157348632812, -88.71688079833984, -85.85218048095703, -82.98748779296875, -80.12278747558594, -77.25808715820312, -74.39339447021484, -71.52870178222656, -68.66400146484375, -65.79930877685547, -62.934608459472656, -60.069915771484375, -57.20521545410156, -54.340518951416016, -51.47582244873047, -48.611122131347656, -45.74642562866211, -42.88172912597656, -40.01702880859375, -37.15233612060547, -34.287635803222656, -31.42293930053711, -28.558242797851562, -25.693546295166016, -22.82884979248047, -19.964153289794922, -17.099454879760742, -14.234758377075195, -11.370061874389648, -8.505363464355469, -5.640666961669922, -2.7759628295898438, 0.08873414993286133, 2.9534311294555664, 5.81812858581543, 8.682825088500977, 11.547521591186523, 14.412220001220703, 17.27691650390625, 20.141613006591797, 23.006309509277344, 25.87100601196289, 28.73570442199707, 31.600400924682617, 34.46509552001953, 37.329795837402344, 40.19449234008789, 43.05918884277344, 45.923885345458984, 48.78858184814453, 51.653282165527344, 54.517974853515625, 57.38267517089844, 60.247371673583984, 63.11206817626953, 65.97676086425781, 68.84146118164062, 71.7061538696289, 74.57085418701172, 77.435546875, 80.30024719238281, 83.16494750976562, 86.0296401977539, 88.89434051513672]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 6.0, 12.0, 7.0, 6.0, 13.0, 14.0, 17.0, 18.0, 22.0, 34.0, 31.0, 25.0, 37.0, 32.0, 38.0, 35.0, 54.0, 35.0, 50.0, 43.0, 32.0, 28.0, 33.0, 39.0, 38.0, 34.0, 31.0, 38.0, 22.0, 23.0, 27.0, 13.0, 17.0, 22.0, 13.0, 12.0, 15.0, 14.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-44.685394287109375, -43.43315124511719, -42.180912017822266, -40.92866897583008, -39.676429748535156, -38.42418670654297, -37.17194366455078, -35.91970443725586, -34.66746139526367, -33.415218353271484, -32.16297912597656, -30.910736083984375, -29.65849494934082, -28.406253814697266, -27.15401268005371, -25.901771545410156, -24.6495304107666, -23.397289276123047, -22.145048141479492, -20.892807006835938, -19.64056396484375, -18.388322830200195, -17.13608169555664, -15.88383960723877, -14.631598472595215, -13.37935733795166, -12.127115249633789, -10.874874114990234, -9.62263298034668, -8.370390892028809, -7.118149757385254, -5.865907669067383, -4.613666534423828, -3.3614249229431152, -2.1091835498809814, -0.8569421768188477, 0.39529943466186523, 1.6475410461425781, 2.899782180786133, 4.152024269104004, 5.404265403747559, 6.6565070152282715, 7.908748626708984, 9.160989761352539, 10.413230895996094, 11.665472984313965, 12.91771411895752, 14.16995620727539, 15.422197341918945, 16.6744384765625, 17.926679611206055, 19.17892074584961, 20.431163787841797, 21.68340492248535, 22.935646057128906, 24.187889099121094, 25.440128326416016, 26.69236946105957, 27.944610595703125, 29.196853637695312, 30.449094772338867, 31.701335906982422, 32.953575134277344, 34.20581817626953, 35.45806121826172]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 26.0, 48.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 9.0, 8.0, 28.0, 39.0, 65.0, 88.0, 137.0, 193.0, 336.0, 483.0, 722.0, 1060.0, 1651.0, 2494.0, 3855.0, 6064.0, 9302.0, 14522.0, 23202.0, 35901.0, 56899.0, 88645.0, 132188.0, 173355.0, 163855.0, 118451.0, 77679.0, 49606.0, 31397.0, 20249.0, 12904.0, 8124.0, 5314.0, 3309.0, 2267.0, 1438.0, 892.0, 593.0, 429.0, 259.0, 184.0, 115.0, 70.0, 52.0, 36.0, 35.0, 18.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5703125, -0.5524063110351562, -0.5345001220703125, -0.5165939331054688, -0.498687744140625, -0.48078155517578125, -0.4628753662109375, -0.44496917724609375, -0.42706298828125, -0.40915679931640625, -0.3912506103515625, -0.37334442138671875, -0.355438232421875, -0.33753204345703125, -0.3196258544921875, -0.30171966552734375, -0.2838134765625, -0.26590728759765625, -0.2480010986328125, -0.23009490966796875, -0.212188720703125, -0.19428253173828125, -0.1763763427734375, -0.15847015380859375, -0.14056396484375, -0.12265777587890625, -0.1047515869140625, -0.08684539794921875, -0.068939208984375, -0.05103302001953125, -0.0331268310546875, -0.01522064208984375, 0.002685546875, 0.02059173583984375, 0.0384979248046875, 0.05640411376953125, 0.074310302734375, 0.09221649169921875, 0.1101226806640625, 0.12802886962890625, 0.14593505859375, 0.16384124755859375, 0.1817474365234375, 0.19965362548828125, 0.217559814453125, 0.23546600341796875, 0.2533721923828125, 0.27127838134765625, 0.2891845703125, 0.30709075927734375, 0.3249969482421875, 0.34290313720703125, 0.360809326171875, 0.37871551513671875, 0.3966217041015625, 0.41452789306640625, 0.43243408203125, 0.45034027099609375, 0.4682464599609375, 0.48615264892578125, 0.504058837890625, 0.5219650268554688, 0.5398712158203125, 0.5577774047851562, 0.57568359375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 7.0, 13.0, 15.0, 11.0, 25.0, 27.0, 36.0, 37.0, 24.0, 48.0, 42.0, 48.0, 41.0, 35.0, 48.0, 1074.0, 44.0, 55.0, 45.0, 52.0, 35.0, 43.0, 31.0, 35.0, 23.0, 17.0, 17.0, 17.0, 18.0, 16.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.7744140625, -3.638671875, -3.5029296875, -3.3671875, -3.2314453125, -3.095703125, -2.9599609375, -2.82421875, -2.6884765625, -2.552734375, -2.4169921875, -2.28125, -2.1455078125, -2.009765625, -1.8740234375, -1.73828125, -1.6025390625, -1.466796875, -1.3310546875, -1.1953125, -1.0595703125, -0.923828125, -0.7880859375, -0.65234375, -0.5166015625, -0.380859375, -0.2451171875, -0.109375, 0.0263671875, 0.162109375, 0.2978515625, 0.43359375, 0.5693359375, 0.705078125, 0.8408203125, 0.9765625, 1.1123046875, 1.248046875, 1.3837890625, 1.51953125, 1.6552734375, 1.791015625, 1.9267578125, 2.0625, 2.1982421875, 2.333984375, 2.4697265625, 2.60546875, 2.7412109375, 2.876953125, 3.0126953125, 3.1484375, 3.2841796875, 3.419921875, 3.5556640625, 3.69140625, 3.8271484375, 3.962890625, 4.0986328125, 4.234375, 4.3701171875, 4.505859375, 4.6416015625, 4.77734375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 14.0, 15.0, 23.0, 34.0, 49.0, 82.0, 162.0, 212.0, 396.0, 646.0, 1139.0, 1927.0, 3183.0, 5130.0, 8602.0, 14507.0, 24499.0, 40960.0, 67843.0, 108318.0, 156442.0, 1229716.0, 156428.0, 107360.0, 67558.0, 40941.0, 24308.0, 14851.0, 8730.0, 5288.0, 3131.0, 1861.0, 1128.0, 712.0, 358.0, 234.0, 162.0, 71.0, 37.0, 24.0, 12.0, 18.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.492919921875, -0.47820281982421875, -0.4634857177734375, -0.44876861572265625, -0.434051513671875, -0.41933441162109375, -0.4046173095703125, -0.38990020751953125, -0.37518310546875, -0.36046600341796875, -0.3457489013671875, -0.33103179931640625, -0.316314697265625, -0.30159759521484375, -0.2868804931640625, -0.27216339111328125, -0.2574462890625, -0.24272918701171875, -0.2280120849609375, -0.21329498291015625, -0.198577880859375, -0.18386077880859375, -0.1691436767578125, -0.15442657470703125, -0.13970947265625, -0.12499237060546875, -0.1102752685546875, -0.09555816650390625, -0.080841064453125, -0.06612396240234375, -0.0514068603515625, -0.03668975830078125, -0.02197265625, -0.00725555419921875, 0.0074615478515625, 0.02217864990234375, 0.036895751953125, 0.05161285400390625, 0.0663299560546875, 0.08104705810546875, 0.09576416015625, 0.11048126220703125, 0.1251983642578125, 0.13991546630859375, 0.154632568359375, 0.16934967041015625, 0.1840667724609375, 0.19878387451171875, 0.2135009765625, 0.22821807861328125, 0.2429351806640625, 0.25765228271484375, 0.272369384765625, 0.28708648681640625, 0.3018035888671875, 0.31652069091796875, 0.33123779296875, 0.34595489501953125, 0.3606719970703125, 0.37538909912109375, 0.390106201171875, 0.40482330322265625, 0.4195404052734375, 0.43425750732421875, 0.448974609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 13.0, 6.0, 11.0, 20.0, 25.0, 29.0, 39.0, 44.0, 64.0, 81.0, 89.0, 90.0, 98.0, 76.0, 75.0, 58.0, 37.0, 26.0, 27.0, 17.0, 15.0, 9.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.006439208984375, -0.0062631964683532715, -0.006087183952331543, -0.0059111714363098145, -0.005735158920288086, -0.005559146404266357, -0.005383133888244629, -0.0052071213722229, -0.005031108856201172, -0.004855096340179443, -0.004679083824157715, -0.004503071308135986, -0.004327058792114258, -0.004151046276092529, -0.003975033760070801, -0.0037990212440490723, -0.0036230087280273438, -0.0034469962120056152, -0.0032709836959838867, -0.003094971179962158, -0.0029189586639404297, -0.002742946147918701, -0.0025669336318969727, -0.002390921115875244, -0.0022149085998535156, -0.002038896083831787, -0.0018628835678100586, -0.00168687105178833, -0.0015108585357666016, -0.001334846019744873, -0.0011588335037231445, -0.000982820987701416, -0.0008068084716796875, -0.000630795955657959, -0.00045478343963623047, -0.00027877092361450195, -0.00010275840759277344, 7.325410842895508e-05, 0.0002492666244506836, 0.0004252791404724121, 0.0006012916564941406, 0.0007773041725158691, 0.0009533166885375977, 0.0011293292045593262, 0.0013053417205810547, 0.0014813542366027832, 0.0016573667526245117, 0.0018333792686462402, 0.0020093917846679688, 0.0021854043006896973, 0.0023614168167114258, 0.0025374293327331543, 0.002713441848754883, 0.0028894543647766113, 0.00306546688079834, 0.0032414793968200684, 0.003417491912841797, 0.0035935044288635254, 0.003769516944885254, 0.003945529460906982, 0.004121541976928711, 0.0042975544929504395, 0.004473567008972168, 0.0046495795249938965, 0.004825592041015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 11.0, 15.0, 16.0, 36.0, 53.0, 76.0, 133.0, 225.0, 501.0, 2850.0, 1018335.0, 24836.0, 750.0, 289.0, 144.0, 97.0, 50.0, 40.0, 18.0, 15.0, 9.0, 12.0, 8.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.10495376586914062, -0.10102081298828125, -0.09708786010742188, -0.0931549072265625, -0.08922195434570312, -0.08528900146484375, -0.08135604858398438, -0.077423095703125, -0.07349014282226562, -0.06955718994140625, -0.06562423706054688, -0.0616912841796875, -0.057758331298828125, -0.05382537841796875, -0.049892425537109375, -0.04595947265625, -0.042026519775390625, -0.03809356689453125, -0.034160614013671875, -0.0302276611328125, -0.026294708251953125, -0.02236175537109375, -0.018428802490234375, -0.014495849609375, -0.010562896728515625, -0.00662994384765625, -0.002696990966796875, 0.0012359619140625, 0.005168914794921875, 0.00910186767578125, 0.013034820556640625, 0.0169677734375, 0.020900726318359375, 0.02483367919921875, 0.028766632080078125, 0.0326995849609375, 0.036632537841796875, 0.04056549072265625, 0.044498443603515625, 0.048431396484375, 0.052364349365234375, 0.05629730224609375, 0.060230255126953125, 0.0641632080078125, 0.06809616088867188, 0.07202911376953125, 0.07596206665039062, 0.07989501953125, 0.08382797241210938, 0.08776092529296875, 0.09169387817382812, 0.0956268310546875, 0.09955978393554688, 0.10349273681640625, 0.10742568969726562, 0.111358642578125, 0.11529159545898438, 0.11922454833984375, 0.12315750122070312, 0.1270904541015625, 0.13102340698242188, 0.13495635986328125, 0.13888931274414062, 0.142822265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 48.0, 807.0, 148.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026813577860593796, -0.0016594692133367062, -0.0006375806406140327, 0.00038430793210864067, 0.001406196504831314, 0.0024280850775539875, 0.003449973650276661, 0.004471862222999334, 0.005493750795722008, 0.006515639368444681, 0.007537527941167355, 0.008559416979551315, 0.009581305086612701, 0.010603193193674088, 0.011625082232058048, 0.012646971270442009, 0.013668859377503395, 0.014690747484564781, 0.015712637454271317, 0.016734525561332703, 0.01775641366839409, 0.018778301775455475, 0.01980018988251686, 0.020822079852223396, 0.021843967959284782, 0.02286585606634617, 0.023887746036052704, 0.02490963414311409, 0.025931522250175476, 0.026953410357236862, 0.02797529846429825, 0.028997188434004784, 0.03001907467842102, 0.031040962785482407, 0.03206285089254379, 0.03308473899960518, 0.034106627106666565, 0.03512851893901825, 0.036150407046079636, 0.03717229515314102, 0.03819418326020241, 0.039216071367263794, 0.04023795947432518, 0.041259847581386566, 0.04228173941373825, 0.04330362752079964, 0.04432551562786102, 0.04534740373492241, 0.046369291841983795, 0.04739117994904518, 0.04841306805610657, 0.049434956163167953, 0.05045684427022934, 0.051478736102581024, 0.05250062420964241, 0.053522512316703796, 0.05454440042376518, 0.05556628853082657, 0.056588176637887955, 0.05761006474494934, 0.058631956577301025, 0.05965384468436241, 0.0606757327914238, 0.061697620898485184, 0.06271950900554657]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 10.0, 7.0, 10.0, 15.0, 24.0, 26.0, 24.0, 30.0, 45.0, 42.0, 46.0, 74.0, 80.0, 68.0, 63.0, 69.0, 63.0, 50.0, 46.0, 51.0, 29.0, 28.0, 29.0, 23.0, 16.0, 10.0, 13.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00514751672744751, -0.005015549249947071, -0.004883581772446632, -0.004751614294946194, -0.004619646817445755, -0.004487679339945316, -0.004355711862444878, -0.004223744384944439, -0.004091776907444, -0.0039598094299435616, -0.003827841952443123, -0.003695874474942684, -0.0035639069974422455, -0.003431939519941807, -0.003299972042441368, -0.0031680045649409294, -0.0030360370874404907, -0.002904069609940052, -0.0027721021324396133, -0.0026401346549391747, -0.002508167177438736, -0.0023761996999382973, -0.0022442322224378586, -0.00211226474493742, -0.001980297267436981, -0.0018483297899365425, -0.0017163623124361038, -0.0015843948349356651, -0.0014524273574352264, -0.0013204598799347878, -0.001188492402434349, -0.0010565249249339104, -0.0009245574474334717, -0.000792589969933033, -0.0006606224924325943, -0.0005286550149321556, -0.0003966875374317169, -0.00026472005993127823, -0.00013275258243083954, -7.851049304008484e-07, 0.00013118237257003784, 0.00026314985007047653, 0.0003951173275709152, 0.0005270848050713539, 0.0006590522825717926, 0.0007910197600722313, 0.00092298723757267, 0.0010549547150731087, 0.0011869221925735474, 0.001318889670073986, 0.0014508571475744247, 0.0015828246250748634, 0.0017147921025753021, 0.0018467595800757408, 0.0019787270575761795, 0.002110694535076618, 0.002242662012577057, 0.0023746294900774956, 0.0025065969675779343, 0.002638564445078373, 0.0027705319225788116, 0.0029024994000792503, 0.003034466877579689, 0.0031664343550801277, 0.0032984018325805664]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 9.0, 10.0, 13.0, 14.0, 22.0, 20.0, 24.0, 30.0, 25.0, 23.0, 40.0, 30.0, 39.0, 31.0, 48.0, 37.0, 57.0, 48.0, 39.0, 37.0, 27.0, 47.0, 31.0, 38.0, 35.0, 34.0, 30.0, 28.0, 22.0, 17.0, 12.0, 13.0, 16.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.31805419921875, -5.1322021484375, -4.94635009765625, -4.760498046875, -4.57464599609375, -4.3887939453125, -4.20294189453125, -4.01708984375, -3.83123779296875, -3.6453857421875, -3.45953369140625, -3.273681640625, -3.08782958984375, -2.9019775390625, -2.71612548828125, -2.5302734375, -2.34442138671875, -2.1585693359375, -1.97271728515625, -1.786865234375, -1.60101318359375, -1.4151611328125, -1.22930908203125, -1.04345703125, -0.85760498046875, -0.6717529296875, -0.48590087890625, -0.300048828125, -0.11419677734375, 0.0716552734375, 0.25750732421875, 0.443359375, 0.62921142578125, 0.8150634765625, 1.00091552734375, 1.186767578125, 1.37261962890625, 1.5584716796875, 1.74432373046875, 1.93017578125, 2.11602783203125, 2.3018798828125, 2.48773193359375, 2.673583984375, 2.85943603515625, 3.0452880859375, 3.23114013671875, 3.4169921875, 3.60284423828125, 3.7886962890625, 3.97454833984375, 4.160400390625, 4.34625244140625, 4.5321044921875, 4.71795654296875, 4.90380859375, 5.08966064453125, 5.2755126953125, 5.46136474609375, 5.647216796875, 5.83306884765625, 6.0189208984375, 6.20477294921875, 6.390625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 14.0, 15.0, 27.0, 34.0, 77.0, 117.0, 209.0, 289.0, 513.0, 922.0, 1688.0, 3437.0, 7373.0, 16888.0, 39932.0, 100964.0, 305161.0, 366589.0, 121406.0, 46459.0, 19404.0, 8679.0, 3902.0, 1952.0, 1035.0, 575.0, 327.0, 175.0, 123.0, 96.0, 63.0, 36.0, 24.0, 16.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.875, -4.72308349609375, -4.5711669921875, -4.41925048828125, -4.267333984375, -4.11541748046875, -3.9635009765625, -3.81158447265625, -3.65966796875, -3.50775146484375, -3.3558349609375, -3.20391845703125, -3.052001953125, -2.90008544921875, -2.7481689453125, -2.59625244140625, -2.4443359375, -2.29241943359375, -2.1405029296875, -1.98858642578125, -1.836669921875, -1.68475341796875, -1.5328369140625, -1.38092041015625, -1.22900390625, -1.07708740234375, -0.9251708984375, -0.77325439453125, -0.621337890625, -0.46942138671875, -0.3175048828125, -0.16558837890625, -0.013671875, 0.13824462890625, 0.2901611328125, 0.44207763671875, 0.593994140625, 0.74591064453125, 0.8978271484375, 1.04974365234375, 1.20166015625, 1.35357666015625, 1.5054931640625, 1.65740966796875, 1.809326171875, 1.96124267578125, 2.1131591796875, 2.26507568359375, 2.4169921875, 2.56890869140625, 2.7208251953125, 2.87274169921875, 3.024658203125, 3.17657470703125, 3.3284912109375, 3.48040771484375, 3.63232421875, 3.78424072265625, 3.9361572265625, 4.08807373046875, 4.239990234375, 4.39190673828125, 4.5438232421875, 4.69573974609375, 4.84765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 0.0, 4.0, 8.0, 6.0, 8.0, 12.0, 16.0, 25.0, 27.0, 18.0, 33.0, 27.0, 36.0, 30.0, 64.0, 58.0, 94.0, 168.0, 1645.0, 269.0, 90.0, 60.0, 47.0, 49.0, 40.0, 29.0, 32.0, 31.0, 17.0, 25.0, 12.0, 14.0, 6.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.34375, -25.584228515625, -24.82470703125, -24.065185546875, -23.3056640625, -22.546142578125, -21.78662109375, -21.027099609375, -20.267578125, -19.508056640625, -18.74853515625, -17.989013671875, -17.2294921875, -16.469970703125, -15.71044921875, -14.950927734375, -14.19140625, -13.431884765625, -12.67236328125, -11.912841796875, -11.1533203125, -10.393798828125, -9.63427734375, -8.874755859375, -8.115234375, -7.355712890625, -6.59619140625, -5.836669921875, -5.0771484375, -4.317626953125, -3.55810546875, -2.798583984375, -2.0390625, -1.279541015625, -0.52001953125, 0.239501953125, 0.9990234375, 1.758544921875, 2.51806640625, 3.277587890625, 4.037109375, 4.796630859375, 5.55615234375, 6.315673828125, 7.0751953125, 7.834716796875, 8.59423828125, 9.353759765625, 10.11328125, 10.872802734375, 11.63232421875, 12.391845703125, 13.1513671875, 13.910888671875, 14.67041015625, 15.429931640625, 16.189453125, 16.948974609375, 17.70849609375, 18.468017578125, 19.2275390625, 19.987060546875, 20.74658203125, 21.506103515625, 22.265625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 8.0, 14.0, 19.0, 13.0, 15.0, 15.0, 45.0, 38.0, 65.0, 67.0, 109.0, 128.0, 209.0, 261.0, 480.0, 2146.0, 231901.0, 2903542.0, 4781.0, 721.0, 331.0, 213.0, 165.0, 88.0, 67.0, 63.0, 32.0, 41.0, 33.0, 20.0, 22.0, 10.0, 8.0, 8.0, 3.0, 6.0, 1.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.78125, -48.0732421875, -46.365234375, -44.6572265625, -42.94921875, -41.2412109375, -39.533203125, -37.8251953125, -36.1171875, -34.4091796875, -32.701171875, -30.9931640625, -29.28515625, -27.5771484375, -25.869140625, -24.1611328125, -22.453125, -20.7451171875, -19.037109375, -17.3291015625, -15.62109375, -13.9130859375, -12.205078125, -10.4970703125, -8.7890625, -7.0810546875, -5.373046875, -3.6650390625, -1.95703125, -0.2490234375, 1.458984375, 3.1669921875, 4.875, 6.5830078125, 8.291015625, 9.9990234375, 11.70703125, 13.4150390625, 15.123046875, 16.8310546875, 18.5390625, 20.2470703125, 21.955078125, 23.6630859375, 25.37109375, 27.0791015625, 28.787109375, 30.4951171875, 32.203125, 33.9111328125, 35.619140625, 37.3271484375, 39.03515625, 40.7431640625, 42.451171875, 44.1591796875, 45.8671875, 47.5751953125, 49.283203125, 50.9912109375, 52.69921875, 54.4072265625, 56.115234375, 57.8232421875, 59.53125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 156.0, 584.0, 250.0, 13.0, 6.0], "bins": [-253.69003295898438, -249.50735473632812, -245.32469177246094, -241.1420135498047, -236.9593505859375, -232.77667236328125, -228.59400939941406, -224.4113311767578, -220.22866821289062, -216.04598999023438, -211.8633270263672, -207.68064880371094, -203.49798583984375, -199.3153076171875, -195.1326446533203, -190.94996643066406, -186.76730346679688, -182.58462524414062, -178.40196228027344, -174.2192840576172, -170.03662109375, -165.85394287109375, -161.67127990722656, -157.4886016845703, -153.30592346191406, -149.1232452392578, -144.94058227539062, -140.75790405273438, -136.5752410888672, -132.39256286621094, -128.20989990234375, -124.0272216796875, -119.84456634521484, -115.66189575195312, -111.4792251586914, -107.29655456542969, -103.11388397216797, -98.93121337890625, -94.74853515625, -90.56587219238281, -86.38319396972656, -82.20052337646484, -78.01785278320312, -73.8351821899414, -69.65251159667969, -65.46984100341797, -61.287166595458984, -57.104496002197266, -52.92182922363281, -48.739158630371094, -44.556488037109375, -40.373817443847656, -36.19114685058594, -32.00847625732422, -27.825801849365234, -23.643131256103516, -19.460460662841797, -15.277790069580078, -11.095118522644043, -6.912446975708008, -2.729776382446289, 1.4528942108154297, 5.635566711425781, 9.8182373046875, 14.000907897949219]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 11.0, 1.0, 5.0, 5.0, 7.0, 12.0, 11.0, 7.0, 12.0, 11.0, 17.0, 18.0, 22.0, 20.0, 27.0, 28.0, 27.0, 44.0, 33.0, 46.0, 44.0, 48.0, 48.0, 40.0, 47.0, 44.0, 47.0, 42.0, 40.0, 23.0, 25.0, 33.0, 21.0, 24.0, 17.0, 16.0, 15.0, 15.0, 12.0, 11.0, 8.0, 7.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.866756439208984, -47.237186431884766, -45.60762023925781, -43.978050231933594, -42.34848403930664, -40.71891403198242, -39.08934783935547, -37.45977783203125, -35.83020782470703, -34.20063781738281, -32.57107162475586, -30.94150161743164, -29.311935424804688, -27.68236541748047, -26.052797317504883, -24.423229217529297, -22.793663024902344, -21.164094924926758, -19.534526824951172, -17.904956817626953, -16.275390625, -14.645821571350098, -13.016252517700195, -11.38668441772461, -9.757116317749023, -8.127548217773438, -6.497979640960693, -4.868411064147949, -3.2388429641723633, -1.6092748641967773, 0.020294189453125, 1.649862289428711, 3.2794342041015625, 4.909002304077148, 6.538570880889893, 8.168139457702637, 9.797707557678223, 11.427275657653809, 13.056844711303711, 14.686412811279297, 16.315980911254883, 17.94554901123047, 19.575117111206055, 21.20468521118164, 22.83425521850586, 24.463821411132812, 26.09339141845703, 27.722959518432617, 29.352527618408203, 30.98209571838379, 32.611663818359375, 34.241233825683594, 35.87080001831055, 37.500370025634766, 39.12993621826172, 40.75950622558594, 42.389076232910156, 44.018646240234375, 45.64821243286133, 47.27778244018555, 48.9073486328125, 50.53691864013672, 52.16648864746094, 53.79605484008789, 55.425621032714844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 10.0, 9.0, 16.0, 12.0, 11.0, 22.0, 24.0, 31.0, 23.0, 29.0, 22.0, 34.0, 30.0, 39.0, 43.0, 58.0, 42.0, 42.0, 34.0, 43.0, 38.0, 37.0, 37.0, 39.0, 32.0, 46.0, 31.0, 22.0, 21.0, 19.0, 15.0, 14.0, 13.0, 11.0, 13.0, 6.0, 4.0, 9.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.4361572265625, -5.243408203125, -5.0506591796875, -4.85791015625, -4.6651611328125, -4.472412109375, -4.2796630859375, -4.0869140625, -3.8941650390625, -3.701416015625, -3.5086669921875, -3.31591796875, -3.1231689453125, -2.930419921875, -2.7376708984375, -2.544921875, -2.3521728515625, -2.159423828125, -1.9666748046875, -1.77392578125, -1.5811767578125, -1.388427734375, -1.1956787109375, -1.0029296875, -0.8101806640625, -0.617431640625, -0.4246826171875, -0.23193359375, -0.0391845703125, 0.153564453125, 0.3463134765625, 0.5390625, 0.7318115234375, 0.924560546875, 1.1173095703125, 1.31005859375, 1.5028076171875, 1.695556640625, 1.8883056640625, 2.0810546875, 2.2738037109375, 2.466552734375, 2.6593017578125, 2.85205078125, 3.0447998046875, 3.237548828125, 3.4302978515625, 3.623046875, 3.8157958984375, 4.008544921875, 4.2012939453125, 4.39404296875, 4.5867919921875, 4.779541015625, 4.9722900390625, 5.1650390625, 5.3577880859375, 5.550537109375, 5.7432861328125, 5.93603515625, 6.1287841796875, 6.321533203125, 6.5142822265625, 6.70703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 9.0, 8.0, 10.0, 17.0, 21.0, 23.0, 26.0, 20.0, 23.0, 27.0, 19.0, 52.0, 84.0, 229.0, 941.0, 5483.0, 97002.0, 3231045.0, 838919.0, 17329.0, 2066.0, 426.0, 147.0, 69.0, 43.0, 41.0, 28.0, 28.0, 17.0, 19.0, 16.0, 19.0, 15.0, 7.0, 8.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.177001953125, -20.38525390625, -19.593505859375, -18.8017578125, -18.010009765625, -17.21826171875, -16.426513671875, -15.634765625, -14.843017578125, -14.05126953125, -13.259521484375, -12.4677734375, -11.676025390625, -10.88427734375, -10.092529296875, -9.30078125, -8.509033203125, -7.71728515625, -6.925537109375, -6.1337890625, -5.342041015625, -4.55029296875, -3.758544921875, -2.966796875, -2.175048828125, -1.38330078125, -0.591552734375, 0.2001953125, 0.991943359375, 1.78369140625, 2.575439453125, 3.3671875, 4.158935546875, 4.95068359375, 5.742431640625, 6.5341796875, 7.325927734375, 8.11767578125, 8.909423828125, 9.701171875, 10.492919921875, 11.28466796875, 12.076416015625, 12.8681640625, 13.659912109375, 14.45166015625, 15.243408203125, 16.03515625, 16.826904296875, 17.61865234375, 18.410400390625, 19.2021484375, 19.993896484375, 20.78564453125, 21.577392578125, 22.369140625, 23.160888671875, 23.95263671875, 24.744384765625, 25.5361328125, 26.327880859375, 27.11962890625, 27.911376953125, 28.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 6.0, 2.0, 8.0, 15.0, 12.0, 12.0, 17.0, 24.0, 30.0, 24.0, 50.0, 55.0, 67.0, 95.0, 97.0, 117.0, 164.0, 217.0, 255.0, 319.0, 358.0, 352.0, 345.0, 298.0, 235.0, 203.0, 152.0, 114.0, 102.0, 71.0, 68.0, 46.0, 31.0, 33.0, 19.0, 17.0, 14.0, 5.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-10.625, -10.3140869140625, -10.003173828125, -9.6922607421875, -9.38134765625, -9.0704345703125, -8.759521484375, -8.4486083984375, -8.1376953125, -7.8267822265625, -7.515869140625, -7.2049560546875, -6.89404296875, -6.5831298828125, -6.272216796875, -5.9613037109375, -5.650390625, -5.3394775390625, -5.028564453125, -4.7176513671875, -4.40673828125, -4.0958251953125, -3.784912109375, -3.4739990234375, -3.1630859375, -2.8521728515625, -2.541259765625, -2.2303466796875, -1.91943359375, -1.6085205078125, -1.297607421875, -0.9866943359375, -0.67578125, -0.3648681640625, -0.053955078125, 0.2569580078125, 0.56787109375, 0.8787841796875, 1.189697265625, 1.5006103515625, 1.8115234375, 2.1224365234375, 2.433349609375, 2.7442626953125, 3.05517578125, 3.3660888671875, 3.677001953125, 3.9879150390625, 4.298828125, 4.6097412109375, 4.920654296875, 5.2315673828125, 5.54248046875, 5.8533935546875, 6.164306640625, 6.4752197265625, 6.7861328125, 7.0970458984375, 7.407958984375, 7.7188720703125, 8.02978515625, 8.3406982421875, 8.651611328125, 8.9625244140625, 9.2734375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 11.0, 26.0, 28.0, 26.0, 46.0, 63.0, 101.0, 149.0, 218.0, 312.0, 807.0, 6086.0, 371188.0, 3763225.0, 48539.0, 2017.0, 543.0, 266.0, 156.0, 118.0, 76.0, 67.0, 44.0, 41.0, 27.0, 25.0, 10.0, 9.0, 7.0, 12.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.84375, -38.3837890625, -36.923828125, -35.4638671875, -34.00390625, -32.5439453125, -31.083984375, -29.6240234375, -28.1640625, -26.7041015625, -25.244140625, -23.7841796875, -22.32421875, -20.8642578125, -19.404296875, -17.9443359375, -16.484375, -15.0244140625, -13.564453125, -12.1044921875, -10.64453125, -9.1845703125, -7.724609375, -6.2646484375, -4.8046875, -3.3447265625, -1.884765625, -0.4248046875, 1.03515625, 2.4951171875, 3.955078125, 5.4150390625, 6.875, 8.3349609375, 9.794921875, 11.2548828125, 12.71484375, 14.1748046875, 15.634765625, 17.0947265625, 18.5546875, 20.0146484375, 21.474609375, 22.9345703125, 24.39453125, 25.8544921875, 27.314453125, 28.7744140625, 30.234375, 31.6943359375, 33.154296875, 34.6142578125, 36.07421875, 37.5341796875, 38.994140625, 40.4541015625, 41.9140625, 43.3740234375, 44.833984375, 46.2939453125, 47.75390625, 49.2138671875, 50.673828125, 52.1337890625, 53.59375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 59.0, 173.0, 295.0, 310.0, 127.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.20521545410156, -181.99156188964844, -176.77792358398438, -171.56427001953125, -166.35061645507812, -161.136962890625, -155.92330932617188, -150.7096710205078, -145.4960174560547, -140.28236389160156, -135.0687255859375, -129.85507202148438, -124.64141845703125, -119.42776489257812, -114.21411895751953, -109.00047302246094, -103.78681945800781, -98.57316589355469, -93.3595199584961, -88.1458740234375, -82.93222045898438, -77.71856689453125, -72.50492095947266, -67.29127502441406, -62.07762145996094, -56.86397171020508, -51.65032196044922, -46.43667221069336, -41.2230224609375, -36.00937271118164, -30.79572296142578, -25.582073211669922, -20.368423461914062, -15.154773712158203, -9.941123962402344, -4.727474212646484, 0.486175537109375, 5.699825286865234, 10.913475036621094, 16.127124786376953, 21.340774536132812, 26.554424285888672, 31.76807403564453, 36.98172378540039, 42.19537353515625, 47.40902328491211, 52.62267303466797, 57.83632278442383, 63.04997253417969, 68.26362609863281, 73.4772720336914, 78.69091796875, 83.90457153320312, 89.11822509765625, 94.33187103271484, 99.54551696777344, 104.75917053222656, 109.97282409667969, 115.18647003173828, 120.40011596679688, 125.61376953125, 130.82742309570312, 136.04107666015625, 141.2547149658203, 146.46836853027344]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 9.0, 2.0, 6.0, 5.0, 8.0, 9.0, 17.0, 14.0, 15.0, 27.0, 21.0, 26.0, 46.0, 29.0, 35.0, 39.0, 39.0, 38.0, 43.0, 38.0, 38.0, 40.0, 31.0, 41.0, 35.0, 40.0, 33.0, 25.0, 43.0, 36.0, 25.0, 30.0, 22.0, 15.0, 24.0, 17.0, 5.0, 11.0, 7.0, 1.0, 10.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.928253173828125, -39.651458740234375, -38.374664306640625, -37.09787368774414, -35.82107925415039, -34.54428482055664, -33.26749038696289, -31.99069595336914, -30.713903427124023, -29.437108993530273, -28.160316467285156, -26.883522033691406, -25.606727600097656, -24.32993507385254, -23.05314064025879, -21.776348114013672, -20.499553680419922, -19.222759246826172, -17.945966720581055, -16.669172286987305, -15.392378807067871, -14.115585327148438, -12.838790893554688, -11.561997413635254, -10.28520393371582, -9.008410453796387, -7.731616497039795, -6.454822540283203, -5.1780290603637695, -3.901235580444336, -2.624441623687744, -1.3476476669311523, -0.07085800170898438, 1.2059357166290283, 2.482729434967041, 3.7595231533050537, 5.036316871643066, 6.3131103515625, 7.589904308319092, 8.866698265075684, 10.143491744995117, 11.42028522491455, 12.697078704833984, 13.973873138427734, 15.250666618347168, 16.5274600982666, 17.80425453186035, 19.08104705810547, 20.35784149169922, 21.63463592529297, 22.911428451538086, 24.188222885131836, 25.465015411376953, 26.741809844970703, 28.018604278564453, 29.295398712158203, 30.57219123840332, 31.84898567199707, 33.12577819824219, 34.40257263183594, 35.67936706542969, 36.95616149902344, 38.23295211791992, 39.50974655151367, 40.78654098510742]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 45.0, 20.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 8.0, 23.0, 44.0, 58.0, 93.0, 140.0, 249.0, 402.0, 639.0, 1037.0, 1647.0, 2623.0, 4221.0, 6869.0, 11272.0, 19178.0, 32383.0, 56394.0, 97039.0, 159933.0, 213022.0, 175589.0, 109701.0, 64459.0, 36964.0, 21565.0, 12881.0, 7626.0, 4764.0, 2869.0, 1835.0, 1111.0, 689.0, 447.0, 285.0, 168.0, 121.0, 59.0, 40.0, 38.0, 15.0, 15.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.7861328125, -0.7640609741210938, -0.7419891357421875, -0.7199172973632812, -0.697845458984375, -0.6757736206054688, -0.6537017822265625, -0.6316299438476562, -0.60955810546875, -0.5874862670898438, -0.5654144287109375, -0.5433425903320312, -0.521270751953125, -0.49919891357421875, -0.4771270751953125, -0.45505523681640625, -0.4329833984375, -0.41091156005859375, -0.3888397216796875, -0.36676788330078125, -0.344696044921875, -0.32262420654296875, -0.3005523681640625, -0.27848052978515625, -0.25640869140625, -0.23433685302734375, -0.2122650146484375, -0.19019317626953125, -0.168121337890625, -0.14604949951171875, -0.1239776611328125, -0.10190582275390625, -0.079833984375, -0.05776214599609375, -0.0356903076171875, -0.01361846923828125, 0.008453369140625, 0.03052520751953125, 0.0525970458984375, 0.07466888427734375, 0.09674072265625, 0.11881256103515625, 0.1408843994140625, 0.16295623779296875, 0.185028076171875, 0.20709991455078125, 0.2291717529296875, 0.25124359130859375, 0.2733154296875, 0.29538726806640625, 0.3174591064453125, 0.33953094482421875, 0.361602783203125, 0.38367462158203125, 0.4057464599609375, 0.42781829833984375, 0.44989013671875, 0.47196197509765625, 0.4940338134765625, 0.5161056518554688, 0.538177490234375, 0.5602493286132812, 0.5823211669921875, 0.6043930053710938, 0.62646484375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 12.0, 10.0, 11.0, 10.0, 19.0, 21.0, 20.0, 28.0, 28.0, 20.0, 31.0, 39.0, 33.0, 58.0, 44.0, 38.0, 1080.0, 51.0, 35.0, 42.0, 44.0, 31.0, 53.0, 35.0, 37.0, 38.0, 27.0, 26.0, 13.0, 15.0, 8.0, 13.0, 9.0, 9.0, 9.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.40118408203125, -4.2633056640625, -4.12542724609375, -3.987548828125, -3.84967041015625, -3.7117919921875, -3.57391357421875, -3.43603515625, -3.29815673828125, -3.1602783203125, -3.02239990234375, -2.884521484375, -2.74664306640625, -2.6087646484375, -2.47088623046875, -2.3330078125, -2.19512939453125, -2.0572509765625, -1.91937255859375, -1.781494140625, -1.64361572265625, -1.5057373046875, -1.36785888671875, -1.22998046875, -1.09210205078125, -0.9542236328125, -0.81634521484375, -0.678466796875, -0.54058837890625, -0.4027099609375, -0.26483154296875, -0.126953125, 0.01092529296875, 0.1488037109375, 0.28668212890625, 0.424560546875, 0.56243896484375, 0.7003173828125, 0.83819580078125, 0.97607421875, 1.11395263671875, 1.2518310546875, 1.38970947265625, 1.527587890625, 1.66546630859375, 1.8033447265625, 1.94122314453125, 2.0791015625, 2.21697998046875, 2.3548583984375, 2.49273681640625, 2.630615234375, 2.76849365234375, 2.9063720703125, 3.04425048828125, 3.18212890625, 3.32000732421875, 3.4578857421875, 3.59576416015625, 3.733642578125, 3.87152099609375, 4.0093994140625, 4.14727783203125, 4.28515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 10.0, 17.0, 25.0, 32.0, 55.0, 69.0, 86.0, 172.0, 274.0, 424.0, 635.0, 1094.0, 1689.0, 2528.0, 3986.0, 6246.0, 9811.0, 15546.0, 24074.0, 37630.0, 58271.0, 87229.0, 121375.0, 506172.0, 843562.0, 122644.0, 87970.0, 58836.0, 38234.0, 24604.0, 15843.0, 10051.0, 6532.0, 4094.0, 2677.0, 1686.0, 1028.0, 650.0, 444.0, 297.0, 207.0, 115.0, 81.0, 49.0, 30.0, 15.0, 12.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.409423828125, -0.395782470703125, -0.38214111328125, -0.368499755859375, -0.3548583984375, -0.341217041015625, -0.32757568359375, -0.313934326171875, -0.30029296875, -0.286651611328125, -0.27301025390625, -0.259368896484375, -0.2457275390625, -0.232086181640625, -0.21844482421875, -0.204803466796875, -0.191162109375, -0.177520751953125, -0.16387939453125, -0.150238037109375, -0.1365966796875, -0.122955322265625, -0.10931396484375, -0.095672607421875, -0.08203125, -0.068389892578125, -0.05474853515625, -0.041107177734375, -0.0274658203125, -0.013824462890625, -0.00018310546875, 0.013458251953125, 0.027099609375, 0.040740966796875, 0.05438232421875, 0.068023681640625, 0.0816650390625, 0.095306396484375, 0.10894775390625, 0.122589111328125, 0.13623046875, 0.149871826171875, 0.16351318359375, 0.177154541015625, 0.1907958984375, 0.204437255859375, 0.21807861328125, 0.231719970703125, 0.245361328125, 0.259002685546875, 0.27264404296875, 0.286285400390625, 0.2999267578125, 0.313568115234375, 0.32720947265625, 0.340850830078125, 0.3544921875, 0.368133544921875, 0.38177490234375, 0.395416259765625, 0.4090576171875, 0.422698974609375, 0.43634033203125, 0.449981689453125, 0.463623046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 6.0, 3.0, 7.0, 6.0, 8.0, 13.0, 12.0, 21.0, 26.0, 17.0, 32.0, 35.0, 46.0, 41.0, 58.0, 79.0, 74.0, 64.0, 65.0, 52.0, 61.0, 49.0, 36.0, 29.0, 27.0, 19.0, 19.0, 18.0, 8.0, 11.0, 11.0, 7.0, 5.0, 5.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00431060791015625, -0.004188179969787598, -0.004065752029418945, -0.003943324089050293, -0.0038208961486816406, -0.0036984682083129883, -0.003576040267944336, -0.0034536123275756836, -0.0033311843872070312, -0.003208756446838379, -0.0030863285064697266, -0.0029639005661010742, -0.002841472625732422, -0.0027190446853637695, -0.002596616744995117, -0.002474188804626465, -0.0023517608642578125, -0.00222933292388916, -0.002106904983520508, -0.0019844770431518555, -0.0018620491027832031, -0.0017396211624145508, -0.0016171932220458984, -0.001494765281677246, -0.0013723373413085938, -0.0012499094009399414, -0.001127481460571289, -0.0010050535202026367, -0.0008826255798339844, -0.000760197639465332, -0.0006377696990966797, -0.0005153417587280273, -0.000392913818359375, -0.00027048587799072266, -0.0001480579376220703, -2.562999725341797e-05, 9.679794311523438e-05, 0.00021922588348388672, 0.00034165382385253906, 0.0004640817642211914, 0.0005865097045898438, 0.0007089376449584961, 0.0008313655853271484, 0.0009537935256958008, 0.0010762214660644531, 0.0011986494064331055, 0.0013210773468017578, 0.0014435052871704102, 0.0015659332275390625, 0.0016883611679077148, 0.0018107891082763672, 0.0019332170486450195, 0.002055644989013672, 0.0021780729293823242, 0.0023005008697509766, 0.002422928810119629, 0.0025453567504882812, 0.0026677846908569336, 0.002790212631225586, 0.0029126405715942383, 0.0030350685119628906, 0.003157496452331543, 0.0032799243927001953, 0.0034023523330688477, 0.0035247802734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 7.0, 11.0, 6.0, 12.0, 18.0, 17.0, 23.0, 22.0, 35.0, 57.0, 63.0, 126.0, 183.0, 316.0, 885.0, 34974.0, 1003709.0, 6674.0, 590.0, 279.0, 171.0, 107.0, 69.0, 28.0, 38.0, 29.0, 19.0, 14.0, 15.0, 18.0, 8.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08575439453125, -0.08301925659179688, -0.08028411865234375, -0.07754898071289062, -0.0748138427734375, -0.07207870483398438, -0.06934356689453125, -0.06660842895507812, -0.063873291015625, -0.061138153076171875, -0.05840301513671875, -0.055667877197265625, -0.0529327392578125, -0.050197601318359375, -0.04746246337890625, -0.044727325439453125, -0.0419921875, -0.039257049560546875, -0.03652191162109375, -0.033786773681640625, -0.0310516357421875, -0.028316497802734375, -0.02558135986328125, -0.022846221923828125, -0.020111083984375, -0.017375946044921875, -0.01464080810546875, -0.011905670166015625, -0.0091705322265625, -0.006435394287109375, -0.00370025634765625, -0.000965118408203125, 0.00177001953125, 0.004505157470703125, 0.00724029541015625, 0.009975433349609375, 0.0127105712890625, 0.015445709228515625, 0.01818084716796875, 0.020915985107421875, 0.023651123046875, 0.026386260986328125, 0.02912139892578125, 0.031856536865234375, 0.0345916748046875, 0.037326812744140625, 0.04006195068359375, 0.042797088623046875, 0.0455322265625, 0.048267364501953125, 0.05100250244140625, 0.053737640380859375, 0.0564727783203125, 0.059207916259765625, 0.06194305419921875, 0.06467819213867188, 0.067413330078125, 0.07014846801757812, 0.07288360595703125, 0.07561874389648438, 0.0783538818359375, 0.08108901977539062, 0.08382415771484375, 0.08655929565429688, 0.08929443359375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 10.0, 174.0, 731.0, 93.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030269038397818804, -0.002339038299396634, -0.001651172642596066, -0.0009633069857954979, -0.0002754414454102516, 0.00041242409497499466, 0.0011002898681908846, 0.0017881554085761309, 0.002476020948961377, 0.0031638864893466234, 0.0038517522625625134, 0.00453961780294776, 0.005227483343333006, 0.005915348883718252, 0.006603214889764786, 0.007291080430150032, 0.007978945970535278, 0.008666811510920525, 0.009354677051305771, 0.010042542591691017, 0.010730408132076263, 0.01141827367246151, 0.012106139212846756, 0.012794004753232002, 0.013481870293617249, 0.014169735834002495, 0.014857601374387741, 0.015545466914772987, 0.016233332455158234, 0.01692119799554348, 0.017609063535928726, 0.018296929076313972, 0.018984796479344368, 0.019672662019729614, 0.02036052756011486, 0.021048393100500107, 0.021736258640885353, 0.0224241241812706, 0.023111989721655846, 0.023799855262041092, 0.024487720802426338, 0.025175586342811584, 0.02586345188319683, 0.026551317423582077, 0.027239182963967323, 0.02792704850435257, 0.028614914044737816, 0.029302779585123062, 0.029990646988153458, 0.030678512528538704, 0.03136637806892395, 0.032054245471954346, 0.03274210914969444, 0.03342997655272484, 0.034117840230464935, 0.03480570763349533, 0.03549357131123543, 0.03618143871426582, 0.03686930239200592, 0.037557169795036316, 0.03824503347277641, 0.03893290087580681, 0.039620764553546906, 0.0403086319565773, 0.0409964956343174]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 8.0, 12.0, 15.0, 17.0, 25.0, 28.0, 30.0, 35.0, 35.0, 50.0, 35.0, 38.0, 53.0, 41.0, 39.0, 39.0, 47.0, 51.0, 53.0, 45.0, 52.0, 37.0, 30.0, 26.0, 29.0, 21.0, 21.0, 14.0, 11.0, 16.0, 12.0, 14.0, 7.0, 1.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0028460025787353516, -0.002757125534117222, -0.002668248489499092, -0.0025793714448809624, -0.0024904944002628326, -0.002401617355644703, -0.002312740311026573, -0.0022238632664084435, -0.0021349862217903137, -0.002046109177172184, -0.0019572321325540543, -0.0018683550879359245, -0.0017794780433177948, -0.001690600998699665, -0.0016017239540815353, -0.0015128469094634056, -0.0014239698648452759, -0.0013350928202271461, -0.0012462157756090164, -0.0011573387309908867, -0.001068461686372757, -0.0009795846417546272, -0.0008907075971364975, -0.0008018305525183678, -0.000712953507900238, -0.0006240764632821083, -0.0005351994186639786, -0.00044632237404584885, -0.0003574453294277191, -0.0002685682848095894, -0.00017969124019145966, -9.081419557332993e-05, -1.9371509552001953e-06, 8.693989366292953e-05, 0.00017581693828105927, 0.000264693982899189, 0.0003535710275173187, 0.00044244807213544846, 0.0005313251167535782, 0.0006202021613717079, 0.0007090792059898376, 0.0007979562506079674, 0.0008868332952260971, 0.0009757103398442268, 0.0010645873844623566, 0.0011534644290804863, 0.001242341473698616, 0.0013312185183167458, 0.0014200955629348755, 0.0015089726075530052, 0.001597849652171135, 0.0016867266967892647, 0.0017756037414073944, 0.0018644807860255241, 0.001953357830643654, 0.0020422348752617836, 0.0021311119198799133, 0.002219988964498043, 0.002308866009116173, 0.0023977430537343025, 0.0024866200983524323, 0.002575497142970562, 0.0026643741875886917, 0.0027532512322068214, 0.002842128276824951]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 10.0, 8.0, 14.0, 19.0, 14.0, 16.0, 26.0, 19.0, 25.0, 33.0, 42.0, 27.0, 46.0, 19.0, 49.0, 30.0, 43.0, 32.0, 47.0, 51.0, 48.0, 42.0, 46.0, 26.0, 50.0, 36.0, 23.0, 26.0, 18.0, 14.0, 22.0, 15.0, 10.0, 6.0, 10.0, 9.0, 4.0, 11.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.32684326171875, -5.1302490234375, -4.93365478515625, -4.737060546875, -4.54046630859375, -4.3438720703125, -4.14727783203125, -3.95068359375, -3.75408935546875, -3.5574951171875, -3.36090087890625, -3.164306640625, -2.96771240234375, -2.7711181640625, -2.57452392578125, -2.3779296875, -2.18133544921875, -1.9847412109375, -1.78814697265625, -1.591552734375, -1.39495849609375, -1.1983642578125, -1.00177001953125, -0.80517578125, -0.60858154296875, -0.4119873046875, -0.21539306640625, -0.018798828125, 0.17779541015625, 0.3743896484375, 0.57098388671875, 0.767578125, 0.96417236328125, 1.1607666015625, 1.35736083984375, 1.553955078125, 1.75054931640625, 1.9471435546875, 2.14373779296875, 2.34033203125, 2.53692626953125, 2.7335205078125, 2.93011474609375, 3.126708984375, 3.32330322265625, 3.5198974609375, 3.71649169921875, 3.9130859375, 4.10968017578125, 4.3062744140625, 4.50286865234375, 4.699462890625, 4.89605712890625, 5.0926513671875, 5.28924560546875, 5.48583984375, 5.68243408203125, 5.8790283203125, 6.07562255859375, 6.272216796875, 6.46881103515625, 6.6654052734375, 6.86199951171875, 7.05859375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 10.0, 16.0, 14.0, 20.0, 31.0, 59.0, 79.0, 115.0, 183.0, 341.0, 550.0, 965.0, 1789.0, 3440.0, 6680.0, 14493.0, 39002.0, 123582.0, 447300.0, 279982.0, 80562.0, 27073.0, 10958.0, 5087.0, 2693.0, 1473.0, 821.0, 484.0, 276.0, 153.0, 98.0, 61.0, 42.0, 26.0, 27.0, 19.0, 7.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.438720703125, -5.25634765625, -5.073974609375, -4.8916015625, -4.709228515625, -4.52685546875, -4.344482421875, -4.162109375, -3.979736328125, -3.79736328125, -3.614990234375, -3.4326171875, -3.250244140625, -3.06787109375, -2.885498046875, -2.703125, -2.520751953125, -2.33837890625, -2.156005859375, -1.9736328125, -1.791259765625, -1.60888671875, -1.426513671875, -1.244140625, -1.061767578125, -0.87939453125, -0.697021484375, -0.5146484375, -0.332275390625, -0.14990234375, 0.032470703125, 0.21484375, 0.397216796875, 0.57958984375, 0.761962890625, 0.9443359375, 1.126708984375, 1.30908203125, 1.491455078125, 1.673828125, 1.856201171875, 2.03857421875, 2.220947265625, 2.4033203125, 2.585693359375, 2.76806640625, 2.950439453125, 3.1328125, 3.315185546875, 3.49755859375, 3.679931640625, 3.8623046875, 4.044677734375, 4.22705078125, 4.409423828125, 4.591796875, 4.774169921875, 4.95654296875, 5.138916015625, 5.3212890625, 5.503662109375, 5.68603515625, 5.868408203125, 6.05078125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 7.0, 15.0, 13.0, 13.0, 10.0, 24.0, 18.0, 27.0, 30.0, 35.0, 36.0, 32.0, 41.0, 61.0, 51.0, 69.0, 140.0, 1481.0, 322.0, 125.0, 80.0, 46.0, 38.0, 43.0, 32.0, 31.0, 31.0, 23.0, 28.0, 23.0, 16.0, 16.0, 15.0, 11.0, 9.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.09375, -18.49560546875, -17.8974609375, -17.29931640625, -16.701171875, -16.10302734375, -15.5048828125, -14.90673828125, -14.30859375, -13.71044921875, -13.1123046875, -12.51416015625, -11.916015625, -11.31787109375, -10.7197265625, -10.12158203125, -9.5234375, -8.92529296875, -8.3271484375, -7.72900390625, -7.130859375, -6.53271484375, -5.9345703125, -5.33642578125, -4.73828125, -4.14013671875, -3.5419921875, -2.94384765625, -2.345703125, -1.74755859375, -1.1494140625, -0.55126953125, 0.046875, 0.64501953125, 1.2431640625, 1.84130859375, 2.439453125, 3.03759765625, 3.6357421875, 4.23388671875, 4.83203125, 5.43017578125, 6.0283203125, 6.62646484375, 7.224609375, 7.82275390625, 8.4208984375, 9.01904296875, 9.6171875, 10.21533203125, 10.8134765625, 11.41162109375, 12.009765625, 12.60791015625, 13.2060546875, 13.80419921875, 14.40234375, 15.00048828125, 15.5986328125, 16.19677734375, 16.794921875, 17.39306640625, 17.9912109375, 18.58935546875, 19.1875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 21.0, 22.0, 48.0, 50.0, 94.0, 138.0, 198.0, 355.0, 845.0, 17680.0, 3120232.0, 4380.0, 695.0, 342.0, 194.0, 135.0, 77.0, 58.0, 31.0, 36.0, 14.0, 14.0, 8.0, 11.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.1875, -95.75537109375, -93.3232421875, -90.89111328125, -88.458984375, -86.02685546875, -83.5947265625, -81.16259765625, -78.73046875, -76.29833984375, -73.8662109375, -71.43408203125, -69.001953125, -66.56982421875, -64.1376953125, -61.70556640625, -59.2734375, -56.84130859375, -54.4091796875, -51.97705078125, -49.544921875, -47.11279296875, -44.6806640625, -42.24853515625, -39.81640625, -37.38427734375, -34.9521484375, -32.52001953125, -30.087890625, -27.65576171875, -25.2236328125, -22.79150390625, -20.359375, -17.92724609375, -15.4951171875, -13.06298828125, -10.630859375, -8.19873046875, -5.7666015625, -3.33447265625, -0.90234375, 1.52978515625, 3.9619140625, 6.39404296875, 8.826171875, 11.25830078125, 13.6904296875, 16.12255859375, 18.5546875, 20.98681640625, 23.4189453125, 25.85107421875, 28.283203125, 30.71533203125, 33.1474609375, 35.57958984375, 38.01171875, 40.44384765625, 42.8759765625, 45.30810546875, 47.740234375, 50.17236328125, 52.6044921875, 55.03662109375, 57.46875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 29.0, 165.0, 345.0, 291.0, 139.0, 30.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.14201354980469, -51.978763580322266, -49.815513610839844, -47.652259826660156, -45.489009857177734, -43.32575988769531, -41.16250991821289, -38.99925994873047, -36.83600616455078, -34.67275619506836, -32.50950622558594, -30.346254348754883, -28.183002471923828, -26.019752502441406, -23.856502532958984, -21.693252563476562, -19.53000259399414, -17.36675262451172, -15.203500747680664, -13.040250778198242, -10.876999855041504, -8.713748931884766, -6.550498962402344, -4.3872480392456055, -2.223997116088867, -0.06074643135070801, 2.102504253387451, 4.265754699707031, 6.4290056228637695, 8.592256546020508, 10.75550651550293, 12.918757438659668, 15.082008361816406, 17.245258331298828, 19.408510208129883, 21.571760177612305, 23.73501205444336, 25.89826202392578, 28.061511993408203, 30.224761962890625, 32.38801574707031, 34.551265716552734, 36.714515686035156, 38.877769470214844, 41.041019439697266, 43.20426940917969, 45.36751937866211, 47.53076934814453, 49.69401931762695, 51.857269287109375, 54.0205192565918, 56.18376922607422, 58.347023010253906, 60.51027297973633, 62.67352294921875, 64.83677673339844, 67.0000228881836, 69.16327667236328, 71.32652282714844, 73.48977661132812, 75.65302276611328, 77.81627655029297, 79.97952270507812, 82.14277648925781, 84.3060302734375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 3.0, 6.0, 9.0, 5.0, 16.0, 15.0, 13.0, 18.0, 17.0, 21.0, 20.0, 24.0, 25.0, 23.0, 28.0, 40.0, 42.0, 31.0, 42.0, 50.0, 33.0, 47.0, 35.0, 29.0, 41.0, 35.0, 38.0, 27.0, 36.0, 27.0, 33.0, 24.0, 19.0, 16.0, 11.0, 12.0, 14.0, 9.0, 7.0, 11.0, 9.0, 10.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-53.2945556640625, -51.62506866455078, -49.95558166503906, -48.286094665527344, -46.616607666015625, -44.947120666503906, -43.27763748168945, -41.608150482177734, -39.938663482666016, -38.2691764831543, -36.59968948364258, -34.93020248413086, -33.260719299316406, -31.591230392456055, -29.92174530029297, -28.25225830078125, -26.58277130126953, -24.913284301757812, -23.243797302246094, -21.574312210083008, -19.90482521057129, -18.23533821105957, -16.565853118896484, -14.896366119384766, -13.226879119873047, -11.557392120361328, -9.887906074523926, -8.218420028686523, -6.548933029174805, -4.879446029663086, -3.2099599838256836, -1.5404739379882812, 0.1290130615234375, 1.798499584197998, 3.4679861068725586, 5.137472629547119, 6.80695915222168, 8.476446151733398, 10.1459321975708, 11.815418243408203, 13.484905242919922, 15.15439224243164, 16.82387924194336, 18.493364334106445, 20.162851333618164, 21.832338333129883, 23.50182342529297, 25.171310424804688, 26.840797424316406, 28.510284423828125, 30.179771423339844, 31.84925651550293, 33.51874542236328, 35.188232421875, 36.85771560668945, 38.52720260620117, 40.19668960571289, 41.86617660522461, 43.53566360473633, 45.20515060424805, 46.8746337890625, 48.54412078857422, 50.21360778808594, 51.883094787597656, 53.552581787109375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 12.0, 23.0, 17.0, 20.0, 24.0, 18.0, 34.0, 40.0, 33.0, 34.0, 48.0, 35.0, 34.0, 36.0, 44.0, 46.0, 48.0, 51.0, 43.0, 39.0, 38.0, 44.0, 24.0, 34.0, 17.0, 29.0, 14.0, 26.0, 16.0, 8.0, 7.0, 2.0, 11.0, 6.0, 6.0, 2.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.880126953125, -5.66259765625, -5.445068359375, -5.2275390625, -5.010009765625, -4.79248046875, -4.574951171875, -4.357421875, -4.139892578125, -3.92236328125, -3.704833984375, -3.4873046875, -3.269775390625, -3.05224609375, -2.834716796875, -2.6171875, -2.399658203125, -2.18212890625, -1.964599609375, -1.7470703125, -1.529541015625, -1.31201171875, -1.094482421875, -0.876953125, -0.659423828125, -0.44189453125, -0.224365234375, -0.0068359375, 0.210693359375, 0.42822265625, 0.645751953125, 0.86328125, 1.080810546875, 1.29833984375, 1.515869140625, 1.7333984375, 1.950927734375, 2.16845703125, 2.385986328125, 2.603515625, 2.821044921875, 3.03857421875, 3.256103515625, 3.4736328125, 3.691162109375, 3.90869140625, 4.126220703125, 4.34375, 4.561279296875, 4.77880859375, 4.996337890625, 5.2138671875, 5.431396484375, 5.64892578125, 5.866455078125, 6.083984375, 6.301513671875, 6.51904296875, 6.736572265625, 6.9541015625, 7.171630859375, 7.38916015625, 7.606689453125, 7.82421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 6.0, 2.0, 7.0, 11.0, 12.0, 16.0, 22.0, 23.0, 24.0, 24.0, 31.0, 37.0, 45.0, 65.0, 139.0, 476.0, 2103.0, 16446.0, 531872.0, 3454642.0, 177468.0, 8556.0, 1462.0, 357.0, 129.0, 73.0, 45.0, 36.0, 29.0, 24.0, 23.0, 17.0, 16.0, 8.0, 11.0, 5.0, 9.0, 2.0, 7.0, 9.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.453125, -21.661865234375, -20.87060546875, -20.079345703125, -19.2880859375, -18.496826171875, -17.70556640625, -16.914306640625, -16.123046875, -15.331787109375, -14.54052734375, -13.749267578125, -12.9580078125, -12.166748046875, -11.37548828125, -10.584228515625, -9.79296875, -9.001708984375, -8.21044921875, -7.419189453125, -6.6279296875, -5.836669921875, -5.04541015625, -4.254150390625, -3.462890625, -2.671630859375, -1.88037109375, -1.089111328125, -0.2978515625, 0.493408203125, 1.28466796875, 2.075927734375, 2.8671875, 3.658447265625, 4.44970703125, 5.240966796875, 6.0322265625, 6.823486328125, 7.61474609375, 8.406005859375, 9.197265625, 9.988525390625, 10.77978515625, 11.571044921875, 12.3623046875, 13.153564453125, 13.94482421875, 14.736083984375, 15.52734375, 16.318603515625, 17.10986328125, 17.901123046875, 18.6923828125, 19.483642578125, 20.27490234375, 21.066162109375, 21.857421875, 22.648681640625, 23.43994140625, 24.231201171875, 25.0224609375, 25.813720703125, 26.60498046875, 27.396240234375, 28.1875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 6.0, 12.0, 23.0, 17.0, 28.0, 28.0, 50.0, 53.0, 78.0, 100.0, 138.0, 170.0, 278.0, 350.0, 404.0, 497.0, 435.0, 359.0, 251.0, 196.0, 161.0, 122.0, 79.0, 74.0, 49.0, 25.0, 22.0, 18.0, 10.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.5859375, -11.1800537109375, -10.774169921875, -10.3682861328125, -9.96240234375, -9.5565185546875, -9.150634765625, -8.7447509765625, -8.3388671875, -7.9329833984375, -7.527099609375, -7.1212158203125, -6.71533203125, -6.3094482421875, -5.903564453125, -5.4976806640625, -5.091796875, -4.6859130859375, -4.280029296875, -3.8741455078125, -3.46826171875, -3.0623779296875, -2.656494140625, -2.2506103515625, -1.8447265625, -1.4388427734375, -1.032958984375, -0.6270751953125, -0.22119140625, 0.1846923828125, 0.590576171875, 0.9964599609375, 1.40234375, 1.8082275390625, 2.214111328125, 2.6199951171875, 3.02587890625, 3.4317626953125, 3.837646484375, 4.2435302734375, 4.6494140625, 5.0552978515625, 5.461181640625, 5.8670654296875, 6.27294921875, 6.6788330078125, 7.084716796875, 7.4906005859375, 7.896484375, 8.3023681640625, 8.708251953125, 9.1141357421875, 9.52001953125, 9.9259033203125, 10.331787109375, 10.7376708984375, 11.1435546875, 11.5494384765625, 11.955322265625, 12.3612060546875, 12.76708984375, 13.1729736328125, 13.578857421875, 13.9847412109375, 14.390625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 14.0, 10.0, 16.0, 33.0, 26.0, 35.0, 51.0, 99.0, 98.0, 148.0, 171.0, 234.0, 312.0, 706.0, 3268.0, 134564.0, 3938568.0, 111124.0, 2926.0, 636.0, 301.0, 215.0, 164.0, 108.0, 103.0, 62.0, 59.0, 62.0, 37.0, 36.0, 21.0, 18.0, 10.0, 19.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-54.0625, -52.58056640625, -51.0986328125, -49.61669921875, -48.134765625, -46.65283203125, -45.1708984375, -43.68896484375, -42.20703125, -40.72509765625, -39.2431640625, -37.76123046875, -36.279296875, -34.79736328125, -33.3154296875, -31.83349609375, -30.3515625, -28.86962890625, -27.3876953125, -25.90576171875, -24.423828125, -22.94189453125, -21.4599609375, -19.97802734375, -18.49609375, -17.01416015625, -15.5322265625, -14.05029296875, -12.568359375, -11.08642578125, -9.6044921875, -8.12255859375, -6.640625, -5.15869140625, -3.6767578125, -2.19482421875, -0.712890625, 0.76904296875, 2.2509765625, 3.73291015625, 5.21484375, 6.69677734375, 8.1787109375, 9.66064453125, 11.142578125, 12.62451171875, 14.1064453125, 15.58837890625, 17.0703125, 18.55224609375, 20.0341796875, 21.51611328125, 22.998046875, 24.47998046875, 25.9619140625, 27.44384765625, 28.92578125, 30.40771484375, 31.8896484375, 33.37158203125, 34.853515625, 36.33544921875, 37.8173828125, 39.29931640625, 40.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 7.0, 17.0, 25.0, 59.0, 83.0, 119.0, 158.0, 128.0, 137.0, 107.0, 67.0, 50.0, 21.0, 10.0, 11.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-115.23910522460938, -112.9880599975586, -110.73701477050781, -108.48597717285156, -106.23493194580078, -103.98388671875, -101.73284912109375, -99.48180389404297, -97.23075866699219, -94.9797134399414, -92.72866821289062, -90.47763061523438, -88.2265853881836, -85.97554016113281, -83.72450256347656, -81.47345733642578, -79.222412109375, -76.97136688232422, -74.72032165527344, -72.46928405761719, -70.2182388305664, -67.96719360351562, -65.71615600585938, -63.465110778808594, -61.21406555175781, -58.96302032470703, -56.711978912353516, -54.4609375, -52.20989227294922, -49.95884704589844, -47.70780563354492, -45.456764221191406, -43.205718994140625, -40.954673767089844, -38.70363235473633, -36.45259094238281, -34.20154571533203, -31.950502395629883, -29.699459075927734, -27.448415756225586, -25.197372436523438, -22.94632911682129, -20.69528579711914, -18.444242477416992, -16.193199157714844, -13.942155838012695, -11.691112518310547, -9.440069198608398, -7.18902587890625, -4.937982559204102, -2.686939239501953, -0.4358959197998047, 1.8151473999023438, 4.066190719604492, 6.317234039306641, 8.568277359008789, 10.819320678710938, 13.070363998413086, 15.321407318115234, 17.572450637817383, 19.82349395751953, 22.07453727722168, 24.325580596923828, 26.576623916625977, 28.827667236328125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 10.0, 5.0, 13.0, 13.0, 13.0, 23.0, 24.0, 20.0, 32.0, 32.0, 28.0, 28.0, 34.0, 32.0, 32.0, 41.0, 39.0, 33.0, 50.0, 38.0, 40.0, 44.0, 35.0, 38.0, 30.0, 30.0, 33.0, 20.0, 21.0, 19.0, 22.0, 20.0, 9.0, 19.0, 12.0, 7.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 0.0, 2.0], "bins": [-43.00483703613281, -41.735206604003906, -40.465576171875, -39.195945739746094, -37.92631530761719, -36.65668487548828, -35.387054443359375, -34.11742401123047, -32.84779357910156, -31.578163146972656, -30.30853271484375, -29.038902282714844, -27.769271850585938, -26.49964141845703, -25.230010986328125, -23.96038055419922, -22.69074821472168, -21.421117782592773, -20.151487350463867, -18.88185691833496, -17.612226486206055, -16.34259605407715, -15.072964668273926, -13.80333423614502, -12.533703804016113, -11.264073371887207, -9.9944429397583, -8.724811553955078, -7.45518159866333, -6.185551166534424, -4.915920257568359, -3.646289825439453, -2.376659393310547, -1.107028841972351, 0.16260170936584473, 1.43223237991333, 2.7018628120422363, 3.9714932441711426, 5.241124153137207, 6.510754585266113, 7.7803850173950195, 9.050015449523926, 10.319645881652832, 11.589277267456055, 12.858907699584961, 14.128538131713867, 15.398168563842773, 16.66779899597168, 17.937429428100586, 19.207059860229492, 20.4766902923584, 21.746320724487305, 23.01595115661621, 24.285581588745117, 25.555213928222656, 26.824844360351562, 28.09447479248047, 29.364105224609375, 30.63373565673828, 31.903366088867188, 33.172996520996094, 34.442626953125, 35.712257385253906, 36.98188781738281, 38.25151824951172]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 35.0, 33.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 26.0, 21.0, 30.0, 67.0, 69.0, 115.0, 162.0, 273.0, 385.0, 583.0, 1000.0, 1649.0, 2700.0, 4519.0, 7448.0, 12728.0, 22059.0, 38313.0, 68366.0, 120543.0, 193181.0, 217486.0, 151132.0, 88146.0, 49291.0, 28197.0, 16300.0, 9444.0, 5595.0, 3291.0, 2009.0, 1240.0, 783.0, 490.0, 303.0, 209.0, 141.0, 69.0, 63.0, 27.0, 25.0, 20.0, 9.0, 15.0, 10.0, 3.0, 2.0, 1.0, 8.0, 1.0, 2.0], "bins": [-0.8544921875, -0.8295211791992188, -0.8045501708984375, -0.7795791625976562, -0.754608154296875, -0.7296371459960938, -0.7046661376953125, -0.6796951293945312, -0.65472412109375, -0.6297531127929688, -0.6047821044921875, -0.5798110961914062, -0.554840087890625, -0.5298690795898438, -0.5048980712890625, -0.47992706298828125, -0.4549560546875, -0.42998504638671875, -0.4050140380859375, -0.38004302978515625, -0.355072021484375, -0.33010101318359375, -0.3051300048828125, -0.28015899658203125, -0.25518798828125, -0.23021697998046875, -0.2052459716796875, -0.18027496337890625, -0.155303955078125, -0.13033294677734375, -0.1053619384765625, -0.08039093017578125, -0.055419921875, -0.03044891357421875, -0.0054779052734375, 0.01949310302734375, 0.044464111328125, 0.06943511962890625, 0.0944061279296875, 0.11937713623046875, 0.14434814453125, 0.16931915283203125, 0.1942901611328125, 0.21926116943359375, 0.244232177734375, 0.26920318603515625, 0.2941741943359375, 0.31914520263671875, 0.3441162109375, 0.36908721923828125, 0.3940582275390625, 0.41902923583984375, 0.444000244140625, 0.46897125244140625, 0.4939422607421875, 0.5189132690429688, 0.54388427734375, 0.5688552856445312, 0.5938262939453125, 0.6187973022460938, 0.643768310546875, 0.6687393188476562, 0.6937103271484375, 0.7186813354492188, 0.74365234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 2.0, 4.0, 11.0, 13.0, 13.0, 14.0, 11.0, 13.0, 19.0, 26.0, 21.0, 32.0, 28.0, 30.0, 36.0, 31.0, 32.0, 32.0, 37.0, 36.0, 32.0, 1066.0, 37.0, 36.0, 38.0, 31.0, 38.0, 26.0, 36.0, 25.0, 23.0, 26.0, 26.0, 19.0, 16.0, 7.0, 17.0, 11.0, 16.0, 14.0, 8.0, 4.0, 6.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.509765625, -3.39788818359375, -3.2860107421875, -3.17413330078125, -3.062255859375, -2.95037841796875, -2.8385009765625, -2.72662353515625, -2.61474609375, -2.50286865234375, -2.3909912109375, -2.27911376953125, -2.167236328125, -2.05535888671875, -1.9434814453125, -1.83160400390625, -1.7197265625, -1.60784912109375, -1.4959716796875, -1.38409423828125, -1.272216796875, -1.16033935546875, -1.0484619140625, -0.93658447265625, -0.82470703125, -0.71282958984375, -0.6009521484375, -0.48907470703125, -0.377197265625, -0.26531982421875, -0.1534423828125, -0.04156494140625, 0.0703125, 0.18218994140625, 0.2940673828125, 0.40594482421875, 0.517822265625, 0.62969970703125, 0.7415771484375, 0.85345458984375, 0.96533203125, 1.07720947265625, 1.1890869140625, 1.30096435546875, 1.412841796875, 1.52471923828125, 1.6365966796875, 1.74847412109375, 1.8603515625, 1.97222900390625, 2.0841064453125, 2.19598388671875, 2.307861328125, 2.41973876953125, 2.5316162109375, 2.64349365234375, 2.75537109375, 2.86724853515625, 2.9791259765625, 3.09100341796875, 3.202880859375, 3.31475830078125, 3.4266357421875, 3.53851318359375, 3.650390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 19.0, 31.0, 78.0, 96.0, 215.0, 277.0, 446.0, 685.0, 1219.0, 1887.0, 2982.0, 4802.0, 7588.0, 11936.0, 19156.0, 30000.0, 47377.0, 73601.0, 110181.0, 148516.0, 1211482.0, 140107.0, 100719.0, 67169.0, 43015.0, 27496.0, 16985.0, 10812.0, 6888.0, 4241.0, 2692.0, 1684.0, 1054.0, 648.0, 403.0, 252.0, 144.0, 79.0, 57.0, 36.0, 16.0, 23.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46044921875, -0.4457817077636719, -0.43111419677734375, -0.4164466857910156, -0.4017791748046875, -0.3871116638183594, -0.37244415283203125, -0.3577766418457031, -0.343109130859375, -0.3284416198730469, -0.31377410888671875, -0.2991065979003906, -0.2844390869140625, -0.2697715759277344, -0.25510406494140625, -0.24043655395507812, -0.22576904296875, -0.21110153198242188, -0.19643402099609375, -0.18176651000976562, -0.1670989990234375, -0.15243148803710938, -0.13776397705078125, -0.12309646606445312, -0.108428955078125, -0.09376144409179688, -0.07909393310546875, -0.06442642211914062, -0.0497589111328125, -0.035091400146484375, -0.02042388916015625, -0.005756378173828125, 0.0089111328125, 0.023578643798828125, 0.03824615478515625, 0.052913665771484375, 0.0675811767578125, 0.08224868774414062, 0.09691619873046875, 0.11158370971679688, 0.126251220703125, 0.14091873168945312, 0.15558624267578125, 0.17025375366210938, 0.1849212646484375, 0.19958877563476562, 0.21425628662109375, 0.22892379760742188, 0.24359130859375, 0.2582588195800781, 0.27292633056640625, 0.2875938415527344, 0.3022613525390625, 0.3169288635253906, 0.33159637451171875, 0.3462638854980469, 0.360931396484375, 0.3755989074707031, 0.39026641845703125, 0.4049339294433594, 0.4196014404296875, 0.4342689514160156, 0.44893646240234375, 0.4636039733886719, 0.478271484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 15.0, 19.0, 21.0, 20.0, 17.0, 34.0, 32.0, 34.0, 45.0, 51.0, 67.0, 84.0, 72.0, 68.0, 56.0, 53.0, 37.0, 46.0, 39.0, 36.0, 27.0, 11.0, 12.0, 18.0, 10.0, 11.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042572021484375, -0.004100680351257324, -0.0039441585540771484, -0.0037876367568969727, -0.003631114959716797, -0.003474593162536621, -0.0033180713653564453, -0.0031615495681762695, -0.0030050277709960938, -0.002848505973815918, -0.002691984176635742, -0.0025354623794555664, -0.0023789405822753906, -0.002222418785095215, -0.002065896987915039, -0.0019093751907348633, -0.0017528533935546875, -0.0015963315963745117, -0.001439809799194336, -0.0012832880020141602, -0.0011267662048339844, -0.0009702444076538086, -0.0008137226104736328, -0.000657200813293457, -0.0005006790161132812, -0.00034415721893310547, -0.0001876354217529297, -3.1113624572753906e-05, 0.00012540817260742188, 0.00028192996978759766, 0.00043845176696777344, 0.0005949735641479492, 0.000751495361328125, 0.0009080171585083008, 0.0010645389556884766, 0.0012210607528686523, 0.0013775825500488281, 0.001534104347229004, 0.0016906261444091797, 0.0018471479415893555, 0.0020036697387695312, 0.002160191535949707, 0.002316713333129883, 0.0024732351303100586, 0.0026297569274902344, 0.00278627872467041, 0.002942800521850586, 0.0030993223190307617, 0.0032558441162109375, 0.0034123659133911133, 0.003568887710571289, 0.003725409507751465, 0.0038819313049316406, 0.004038453102111816, 0.004194974899291992, 0.004351496696472168, 0.004508018493652344, 0.0046645402908325195, 0.004821062088012695, 0.004977583885192871, 0.005134105682373047, 0.005290627479553223, 0.0054471492767333984, 0.005603671073913574, 0.00576019287109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 8.0, 3.0, 1.0, 10.0, 14.0, 12.0, 16.0, 20.0, 23.0, 27.0, 47.0, 64.0, 61.0, 95.0, 151.0, 230.0, 536.0, 4533.0, 844770.0, 194827.0, 2039.0, 414.0, 163.0, 109.0, 66.0, 62.0, 60.0, 28.0, 23.0, 38.0, 28.0, 15.0, 8.0, 15.0, 6.0, 5.0, 7.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.11370849609375, -0.11062431335449219, -0.10754013061523438, -0.10445594787597656, -0.10137176513671875, -0.09828758239746094, -0.09520339965820312, -0.09211921691894531, -0.0890350341796875, -0.08595085144042969, -0.08286666870117188, -0.07978248596191406, -0.07669830322265625, -0.07361412048339844, -0.07052993774414062, -0.06744575500488281, -0.064361572265625, -0.06127738952636719, -0.058193206787109375, -0.05510902404785156, -0.05202484130859375, -0.04894065856933594, -0.045856475830078125, -0.04277229309082031, -0.0396881103515625, -0.03660392761230469, -0.033519744873046875, -0.030435562133789062, -0.02735137939453125, -0.024267196655273438, -0.021183013916015625, -0.018098831176757812, -0.0150146484375, -0.011930465698242188, -0.008846282958984375, -0.0057621002197265625, -0.00267791748046875, 0.0004062652587890625, 0.003490447998046875, 0.0065746307373046875, 0.0096588134765625, 0.012742996215820312, 0.015827178955078125, 0.018911361694335938, 0.02199554443359375, 0.025079727172851562, 0.028163909912109375, 0.031248092651367188, 0.034332275390625, 0.03741645812988281, 0.040500640869140625, 0.04358482360839844, 0.04666900634765625, 0.04975318908691406, 0.052837371826171875, 0.05592155456542969, 0.0590057373046875, 0.06208992004394531, 0.06517410278320312, 0.06825828552246094, 0.07134246826171875, 0.07442665100097656, 0.07751083374023438, 0.08059501647949219, 0.08367919921875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 5.0, 85.0, 678.0, 219.0, 25.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032518741209059954, -0.002353122690692544, -0.0014543713768944144, -0.0005556200630962849, 0.0003431313671171665, 0.0012418825644999743, 0.0021406339947134256, 0.003039385424926877, 0.003938136622309685, 0.004836888052523136, 0.0057356394827365875, 0.006634390912950039, 0.00753314234316349, 0.008431892842054367, 0.009330645203590393, 0.01022939570248127, 0.011128148064017296, 0.012026899494230747, 0.012925650924444199, 0.01382440235465765, 0.014723153784871101, 0.015621904283761978, 0.016520656645298004, 0.01741940714418888, 0.018318159505724907, 0.019216910004615784, 0.02011566236615181, 0.021014412865042686, 0.021913165226578712, 0.02281191572546959, 0.023710668087005615, 0.024609418585896492, 0.025508170947432518, 0.026406921446323395, 0.02730567380785942, 0.028204424306750298, 0.029103176668286324, 0.0300019271671772, 0.030900679528713226, 0.03179943189024925, 0.03269818052649498, 0.033596932888031006, 0.03449568152427673, 0.03539443388581276, 0.036293186247348785, 0.03719193860888481, 0.03809068724513054, 0.038989439606666565, 0.03988819196820259, 0.04078694432973862, 0.041685692965984344, 0.04258444532752037, 0.043483197689056396, 0.04438195005059242, 0.04528069868683815, 0.046179451048374176, 0.0470782034099102, 0.04797695577144623, 0.048875704407691956, 0.04977445676922798, 0.05067320913076401, 0.051571961492300034, 0.05247071012854576, 0.05336946249008179, 0.05426821485161781]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 5.0, 5.0, 14.0, 15.0, 12.0, 23.0, 26.0, 31.0, 32.0, 42.0, 38.0, 31.0, 37.0, 47.0, 54.0, 64.0, 55.0, 57.0, 54.0, 57.0, 47.0, 46.0, 36.0, 34.0, 23.0, 23.0, 26.0, 10.0, 8.0, 15.0, 7.0, 9.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004744350910186768, -0.004613455384969711, -0.004482559859752655, -0.004351664334535599, -0.0042207688093185425, -0.004089873284101486, -0.00395897775888443, -0.0038280822336673737, -0.0036971867084503174, -0.003566291183233261, -0.003435395658016205, -0.0033045001327991486, -0.0031736046075820923, -0.003042709082365036, -0.0029118135571479797, -0.0027809180319309235, -0.002650022506713867, -0.002519126981496811, -0.0023882314562797546, -0.0022573359310626984, -0.002126440405845642, -0.001995544880628586, -0.0018646493554115295, -0.0017337538301944733, -0.001602858304977417, -0.0014719627797603607, -0.0013410672545433044, -0.0012101717293262482, -0.001079276204109192, -0.0009483806788921356, -0.0008174851536750793, -0.0006865896284580231, -0.0005556941032409668, -0.0004247985780239105, -0.00029390305280685425, -0.00016300752758979797, -3.21120023727417e-05, 9.878352284431458e-05, 0.00022967904806137085, 0.0003605745732784271, 0.0004914700984954834, 0.0006223656237125397, 0.000753261148929596, 0.0008841566741466522, 0.0010150521993637085, 0.0011459477245807648, 0.001276843249797821, 0.0014077387750148773, 0.0015386343002319336, 0.0016695298254489899, 0.0018004253506660461, 0.0019313208758831024, 0.0020622164011001587, 0.002193111926317215, 0.0023240074515342712, 0.0024549029767513275, 0.002585798501968384, 0.00271669402718544, 0.0028475895524024963, 0.0029784850776195526, 0.003109380602836609, 0.003240276128053665, 0.0033711716532707214, 0.0035020671784877777, 0.003632962703704834]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 13.0, 10.0, 6.0, 8.0, 11.0, 22.0, 15.0, 25.0, 22.0, 17.0, 21.0, 26.0, 31.0, 34.0, 36.0, 47.0, 40.0, 29.0, 44.0, 41.0, 32.0, 44.0, 43.0, 38.0, 34.0, 34.0, 37.0, 28.0, 25.0, 28.0, 20.0, 22.0, 21.0, 16.0, 17.0, 4.0, 7.0, 13.0, 4.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26171875, -5.07354736328125, -4.8853759765625, -4.69720458984375, -4.509033203125, -4.32086181640625, -4.1326904296875, -3.94451904296875, -3.75634765625, -3.56817626953125, -3.3800048828125, -3.19183349609375, -3.003662109375, -2.81549072265625, -2.6273193359375, -2.43914794921875, -2.2509765625, -2.06280517578125, -1.8746337890625, -1.68646240234375, -1.498291015625, -1.31011962890625, -1.1219482421875, -0.93377685546875, -0.74560546875, -0.55743408203125, -0.3692626953125, -0.18109130859375, 0.007080078125, 0.19525146484375, 0.3834228515625, 0.57159423828125, 0.759765625, 0.94793701171875, 1.1361083984375, 1.32427978515625, 1.512451171875, 1.70062255859375, 1.8887939453125, 2.07696533203125, 2.26513671875, 2.45330810546875, 2.6414794921875, 2.82965087890625, 3.017822265625, 3.20599365234375, 3.3941650390625, 3.58233642578125, 3.7705078125, 3.95867919921875, 4.1468505859375, 4.33502197265625, 4.523193359375, 4.71136474609375, 4.8995361328125, 5.08770751953125, 5.27587890625, 5.46405029296875, 5.6522216796875, 5.84039306640625, 6.028564453125, 6.21673583984375, 6.4049072265625, 6.59307861328125, 6.78125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 7.0, 7.0, 9.0, 18.0, 23.0, 37.0, 43.0, 51.0, 85.0, 112.0, 200.0, 268.0, 480.0, 791.0, 1395.0, 2436.0, 4623.0, 8854.0, 18548.0, 43427.0, 120629.0, 387109.0, 298168.0, 93773.0, 35318.0, 15425.0, 7420.0, 3983.0, 2167.0, 1195.0, 722.0, 429.0, 251.0, 183.0, 111.0, 72.0, 58.0, 37.0, 28.0, 16.0, 17.0, 9.0, 9.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.50421142578125, -4.3482666015625, -4.19232177734375, -4.036376953125, -3.88043212890625, -3.7244873046875, -3.56854248046875, -3.41259765625, -3.25665283203125, -3.1007080078125, -2.94476318359375, -2.788818359375, -2.63287353515625, -2.4769287109375, -2.32098388671875, -2.1650390625, -2.00909423828125, -1.8531494140625, -1.69720458984375, -1.541259765625, -1.38531494140625, -1.2293701171875, -1.07342529296875, -0.91748046875, -0.76153564453125, -0.6055908203125, -0.44964599609375, -0.293701171875, -0.13775634765625, 0.0181884765625, 0.17413330078125, 0.330078125, 0.48602294921875, 0.6419677734375, 0.79791259765625, 0.953857421875, 1.10980224609375, 1.2657470703125, 1.42169189453125, 1.57763671875, 1.73358154296875, 1.8895263671875, 2.04547119140625, 2.201416015625, 2.35736083984375, 2.5133056640625, 2.66925048828125, 2.8251953125, 2.98114013671875, 3.1370849609375, 3.29302978515625, 3.448974609375, 3.60491943359375, 3.7608642578125, 3.91680908203125, 4.07275390625, 4.22869873046875, 4.3846435546875, 4.54058837890625, 4.696533203125, 4.85247802734375, 5.0084228515625, 5.16436767578125, 5.3203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 4.0, 12.0, 14.0, 17.0, 12.0, 15.0, 14.0, 21.0, 22.0, 20.0, 29.0, 34.0, 25.0, 43.0, 30.0, 54.0, 83.0, 235.0, 1648.0, 194.0, 67.0, 54.0, 48.0, 38.0, 39.0, 28.0, 30.0, 24.0, 32.0, 22.0, 17.0, 18.0, 11.0, 11.0, 18.0, 12.0, 8.0, 8.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-19.59375, -19.008056640625, -18.42236328125, -17.836669921875, -17.2509765625, -16.665283203125, -16.07958984375, -15.493896484375, -14.908203125, -14.322509765625, -13.73681640625, -13.151123046875, -12.5654296875, -11.979736328125, -11.39404296875, -10.808349609375, -10.22265625, -9.636962890625, -9.05126953125, -8.465576171875, -7.8798828125, -7.294189453125, -6.70849609375, -6.122802734375, -5.537109375, -4.951416015625, -4.36572265625, -3.780029296875, -3.1943359375, -2.608642578125, -2.02294921875, -1.437255859375, -0.8515625, -0.265869140625, 0.31982421875, 0.905517578125, 1.4912109375, 2.076904296875, 2.66259765625, 3.248291015625, 3.833984375, 4.419677734375, 5.00537109375, 5.591064453125, 6.1767578125, 6.762451171875, 7.34814453125, 7.933837890625, 8.51953125, 9.105224609375, 9.69091796875, 10.276611328125, 10.8623046875, 11.447998046875, 12.03369140625, 12.619384765625, 13.205078125, 13.790771484375, 14.37646484375, 14.962158203125, 15.5478515625, 16.133544921875, 16.71923828125, 17.304931640625, 17.890625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 6.0, 6.0, 5.0, 13.0, 11.0, 16.0, 28.0, 35.0, 43.0, 59.0, 87.0, 122.0, 172.0, 236.0, 362.0, 653.0, 7978.0, 3091226.0, 42388.0, 932.0, 392.0, 246.0, 181.0, 128.0, 86.0, 64.0, 50.0, 42.0, 30.0, 28.0, 15.0, 16.0, 13.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-64.1875, -62.3876953125, -60.587890625, -58.7880859375, -56.98828125, -55.1884765625, -53.388671875, -51.5888671875, -49.7890625, -47.9892578125, -46.189453125, -44.3896484375, -42.58984375, -40.7900390625, -38.990234375, -37.1904296875, -35.390625, -33.5908203125, -31.791015625, -29.9912109375, -28.19140625, -26.3916015625, -24.591796875, -22.7919921875, -20.9921875, -19.1923828125, -17.392578125, -15.5927734375, -13.79296875, -11.9931640625, -10.193359375, -8.3935546875, -6.59375, -4.7939453125, -2.994140625, -1.1943359375, 0.60546875, 2.4052734375, 4.205078125, 6.0048828125, 7.8046875, 9.6044921875, 11.404296875, 13.2041015625, 15.00390625, 16.8037109375, 18.603515625, 20.4033203125, 22.203125, 24.0029296875, 25.802734375, 27.6025390625, 29.40234375, 31.2021484375, 33.001953125, 34.8017578125, 36.6015625, 38.4013671875, 40.201171875, 42.0009765625, 43.80078125, 45.6005859375, 47.400390625, 49.2001953125, 51.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [3.0, 4.0, 41.0, 400.0, 483.0, 82.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.019357681274414, -9.892585754394531, -6.76581335067749, -3.639040946960449, -0.5122690200805664, 2.6145029067993164, 5.741275787353516, 8.868047714233398, 11.994819641113281, 15.121591567993164, 18.248363494873047, 21.375137329101562, 24.501907348632812, 27.628681182861328, 30.75545310974121, 33.882225036621094, 37.008995056152344, 40.13576889038086, 43.26253890991211, 46.389312744140625, 49.516082763671875, 52.64285659790039, 55.769630432128906, 58.896400451660156, 62.02317428588867, 65.14994812011719, 68.27671813964844, 71.40348815917969, 74.53026580810547, 77.65703582763672, 80.78380584716797, 83.91058349609375, 87.03734588623047, 90.16411590576172, 93.2908935546875, 96.41766357421875, 99.54443359375, 102.67120361328125, 105.79798126220703, 108.92475128173828, 112.05152130126953, 115.17829132080078, 118.30506896972656, 121.43183898925781, 124.55860900878906, 127.68537902832031, 130.81214904785156, 133.93893432617188, 137.06570434570312, 140.19247436523438, 143.31924438476562, 146.44601440429688, 149.5727996826172, 152.69956970214844, 155.8263397216797, 158.95310974121094, 162.0798797607422, 165.20664978027344, 168.3334197998047, 171.46018981933594, 174.58697509765625, 177.7137451171875, 180.84051513671875, 183.96728515625, 187.09405517578125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 5.0, 14.0, 4.0, 12.0, 14.0, 12.0, 16.0, 22.0, 22.0, 28.0, 27.0, 32.0, 32.0, 33.0, 54.0, 44.0, 40.0, 55.0, 34.0, 66.0, 52.0, 44.0, 43.0, 31.0, 41.0, 34.0, 24.0, 38.0, 33.0, 23.0, 17.0, 14.0, 10.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.58349609375, -51.70321273803711, -49.82292556762695, -47.94264221191406, -46.062355041503906, -44.182071685791016, -42.301788330078125, -40.42150115966797, -38.54121780395508, -36.66093444824219, -34.78064727783203, -32.90036392211914, -31.020078659057617, -29.139793395996094, -27.25950813293457, -25.379222869873047, -23.498937606811523, -21.61865234375, -19.738367080688477, -17.858081817626953, -15.977798461914062, -14.097513198852539, -12.217227935791016, -10.336943626403809, -8.456658363342285, -6.57637357711792, -4.696088790893555, -2.8158035278320312, -0.935518741607666, 0.9447660446166992, 2.8250513076782227, 4.70533561706543, 6.585620880126953, 8.465906143188477, 10.346190452575684, 12.226475715637207, 14.106760025024414, 15.987045288085938, 17.86733055114746, 19.747615814208984, 21.627899169921875, 23.5081844329834, 25.388469696044922, 27.268753051757812, 29.149038314819336, 31.02932357788086, 32.90960693359375, 34.789894104003906, 36.67018127441406, 38.55046463012695, 40.43075180053711, 42.31103515625, 44.191322326660156, 46.07160568237305, 47.95188903808594, 49.832176208496094, 51.712459564208984, 53.592742919921875, 55.47303009033203, 57.35331344604492, 59.23360061645508, 61.11388397216797, 62.994171142578125, 64.87445068359375, 66.7547378540039]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 9.0, 11.0, 10.0, 6.0, 10.0, 20.0, 27.0, 19.0, 17.0, 23.0, 25.0, 40.0, 36.0, 38.0, 34.0, 35.0, 40.0, 44.0, 38.0, 50.0, 40.0, 38.0, 33.0, 34.0, 40.0, 36.0, 24.0, 25.0, 30.0, 21.0, 19.0, 15.0, 21.0, 15.0, 9.0, 12.0, 6.0, 9.0, 2.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.57421875, -5.37542724609375, -5.1766357421875, -4.97784423828125, -4.779052734375, -4.58026123046875, -4.3814697265625, -4.18267822265625, -3.98388671875, -3.78509521484375, -3.5863037109375, -3.38751220703125, -3.188720703125, -2.98992919921875, -2.7911376953125, -2.59234619140625, -2.3935546875, -2.19476318359375, -1.9959716796875, -1.79718017578125, -1.598388671875, -1.39959716796875, -1.2008056640625, -1.00201416015625, -0.80322265625, -0.60443115234375, -0.4056396484375, -0.20684814453125, -0.008056640625, 0.19073486328125, 0.3895263671875, 0.58831787109375, 0.787109375, 0.98590087890625, 1.1846923828125, 1.38348388671875, 1.582275390625, 1.78106689453125, 1.9798583984375, 2.17864990234375, 2.37744140625, 2.57623291015625, 2.7750244140625, 2.97381591796875, 3.172607421875, 3.37139892578125, 3.5701904296875, 3.76898193359375, 3.9677734375, 4.16656494140625, 4.3653564453125, 4.56414794921875, 4.762939453125, 4.96173095703125, 5.1605224609375, 5.35931396484375, 5.55810546875, 5.75689697265625, 5.9556884765625, 6.15447998046875, 6.353271484375, 6.55206298828125, 6.7508544921875, 6.94964599609375, 7.1484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 14.0, 8.0, 10.0, 4.0, 16.0, 18.0, 15.0, 19.0, 32.0, 28.0, 55.0, 97.0, 199.0, 411.0, 836.0, 2198.0, 7793.0, 50624.0, 836289.0, 2848255.0, 411251.0, 27704.0, 5316.0, 1644.0, 659.0, 297.0, 139.0, 97.0, 60.0, 39.0, 31.0, 34.0, 13.0, 9.0, 11.0, 9.0, 6.0, 7.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.140625, -13.6044921875, -13.068359375, -12.5322265625, -11.99609375, -11.4599609375, -10.923828125, -10.3876953125, -9.8515625, -9.3154296875, -8.779296875, -8.2431640625, -7.70703125, -7.1708984375, -6.634765625, -6.0986328125, -5.5625, -5.0263671875, -4.490234375, -3.9541015625, -3.41796875, -2.8818359375, -2.345703125, -1.8095703125, -1.2734375, -0.7373046875, -0.201171875, 0.3349609375, 0.87109375, 1.4072265625, 1.943359375, 2.4794921875, 3.015625, 3.5517578125, 4.087890625, 4.6240234375, 5.16015625, 5.6962890625, 6.232421875, 6.7685546875, 7.3046875, 7.8408203125, 8.376953125, 8.9130859375, 9.44921875, 9.9853515625, 10.521484375, 11.0576171875, 11.59375, 12.1298828125, 12.666015625, 13.2021484375, 13.73828125, 14.2744140625, 14.810546875, 15.3466796875, 15.8828125, 16.4189453125, 16.955078125, 17.4912109375, 18.02734375, 18.5634765625, 19.099609375, 19.6357421875, 20.171875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 7.0, 13.0, 14.0, 29.0, 24.0, 43.0, 37.0, 57.0, 69.0, 102.0, 145.0, 135.0, 216.0, 295.0, 341.0, 403.0, 413.0, 393.0, 311.0, 251.0, 166.0, 145.0, 109.0, 86.0, 52.0, 51.0, 33.0, 35.0, 20.0, 18.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -8.9642333984375, -8.608154296875, -8.2520751953125, -7.89599609375, -7.5399169921875, -7.183837890625, -6.8277587890625, -6.4716796875, -6.1156005859375, -5.759521484375, -5.4034423828125, -5.04736328125, -4.6912841796875, -4.335205078125, -3.9791259765625, -3.623046875, -3.2669677734375, -2.910888671875, -2.5548095703125, -2.19873046875, -1.8426513671875, -1.486572265625, -1.1304931640625, -0.7744140625, -0.4183349609375, -0.062255859375, 0.2938232421875, 0.64990234375, 1.0059814453125, 1.362060546875, 1.7181396484375, 2.07421875, 2.4302978515625, 2.786376953125, 3.1424560546875, 3.49853515625, 3.8546142578125, 4.210693359375, 4.5667724609375, 4.9228515625, 5.2789306640625, 5.635009765625, 5.9910888671875, 6.34716796875, 6.7032470703125, 7.059326171875, 7.4154052734375, 7.771484375, 8.1275634765625, 8.483642578125, 8.8397216796875, 9.19580078125, 9.5518798828125, 9.907958984375, 10.2640380859375, 10.6201171875, 10.9761962890625, 11.332275390625, 11.6883544921875, 12.04443359375, 12.4005126953125, 12.756591796875, 13.1126708984375, 13.46875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 7.0, 7.0, 7.0, 16.0, 25.0, 24.0, 34.0, 55.0, 67.0, 55.0, 90.0, 101.0, 131.0, 169.0, 250.0, 329.0, 617.0, 4472.0, 229493.0, 3860920.0, 92858.0, 2607.0, 558.0, 300.0, 234.0, 178.0, 149.0, 93.0, 90.0, 77.0, 56.0, 40.0, 28.0, 35.0, 19.0, 21.0, 14.0, 10.0, 9.0, 9.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-46.28125, -44.93603515625, -43.5908203125, -42.24560546875, -40.900390625, -39.55517578125, -38.2099609375, -36.86474609375, -35.51953125, -34.17431640625, -32.8291015625, -31.48388671875, -30.138671875, -28.79345703125, -27.4482421875, -26.10302734375, -24.7578125, -23.41259765625, -22.0673828125, -20.72216796875, -19.376953125, -18.03173828125, -16.6865234375, -15.34130859375, -13.99609375, -12.65087890625, -11.3056640625, -9.96044921875, -8.615234375, -7.27001953125, -5.9248046875, -4.57958984375, -3.234375, -1.88916015625, -0.5439453125, 0.80126953125, 2.146484375, 3.49169921875, 4.8369140625, 6.18212890625, 7.52734375, 8.87255859375, 10.2177734375, 11.56298828125, 12.908203125, 14.25341796875, 15.5986328125, 16.94384765625, 18.2890625, 19.63427734375, 20.9794921875, 22.32470703125, 23.669921875, 25.01513671875, 26.3603515625, 27.70556640625, 29.05078125, 30.39599609375, 31.7412109375, 33.08642578125, 34.431640625, 35.77685546875, 37.1220703125, 38.46728515625, 39.8125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 14.0, 27.0, 47.0, 74.0, 132.0, 157.0, 147.0, 126.0, 129.0, 76.0, 42.0, 20.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3076171875, -63.020355224609375, -60.73309326171875, -58.445831298828125, -56.1585693359375, -53.871307373046875, -51.58404541015625, -49.296783447265625, -47.009521484375, -44.722259521484375, -42.43499755859375, -40.147735595703125, -37.8604736328125, -35.573211669921875, -33.28594970703125, -30.998687744140625, -28.71142578125, -26.424163818359375, -24.13690185546875, -21.849639892578125, -19.5623779296875, -17.275115966796875, -14.98785400390625, -12.700592041015625, -10.413330078125, -8.126068115234375, -5.83880615234375, -3.551544189453125, -1.2642822265625, 1.022979736328125, 3.31024169921875, 5.597503662109375, 7.884765625, 10.172027587890625, 12.45928955078125, 14.746551513671875, 17.0338134765625, 19.321075439453125, 21.60833740234375, 23.895599365234375, 26.182861328125, 28.470123291015625, 30.75738525390625, 33.044647216796875, 35.3319091796875, 37.619171142578125, 39.90643310546875, 42.193695068359375, 44.48095703125, 46.768218994140625, 49.05548095703125, 51.342742919921875, 53.6300048828125, 55.917266845703125, 58.20452880859375, 60.491790771484375, 62.779052734375, 65.06631469726562, 67.35357666015625, 69.64083862304688, 71.9281005859375, 74.21536254882812, 76.50262451171875, 78.78988647460938, 81.0771484375]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 15.0, 23.0, 21.0, 17.0, 15.0, 24.0, 28.0, 20.0, 48.0, 27.0, 34.0, 36.0, 41.0, 50.0, 40.0, 38.0, 40.0, 36.0, 43.0, 38.0, 40.0, 31.0, 36.0, 37.0, 31.0, 27.0, 17.0, 19.0, 18.0, 18.0, 7.0, 12.0, 12.0, 5.0, 5.0, 2.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.99188232421875, -38.7181282043457, -37.44437026977539, -36.170616149902344, -34.89685821533203, -33.623104095458984, -32.34934997558594, -31.075593948364258, -29.801837921142578, -28.5280818939209, -27.25432586669922, -25.980571746826172, -24.706815719604492, -23.433059692382812, -22.159305572509766, -20.885549545288086, -19.611793518066406, -18.338037490844727, -17.064281463623047, -15.79052734375, -14.51677131652832, -13.24301528930664, -11.969260215759277, -10.695505142211914, -9.421749114990234, -8.147993087768555, -6.874238014221191, -5.60048246383667, -4.326726913452148, -3.052971363067627, -1.7792158126831055, -0.5054607391357422, 0.7682952880859375, 2.042050838470459, 3.3158063888549805, 4.589561939239502, 5.863317489624023, 7.137073040008545, 8.410828590393066, 9.68458366394043, 10.95833969116211, 12.232095718383789, 13.505850791931152, 14.779605865478516, 16.053361892700195, 17.327117919921875, 18.600872039794922, 19.8746280670166, 21.14838409423828, 22.42214012145996, 23.69589614868164, 24.969650268554688, 26.243406295776367, 27.517162322998047, 28.790916442871094, 30.064672470092773, 31.338428497314453, 32.6121826171875, 33.88594055175781, 35.15969467163086, 36.433448791503906, 37.70720672607422, 38.980960845947266, 40.25471496582031, 41.528472900390625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 48.0, 42.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 19.0, 26.0, 31.0, 70.0, 78.0, 110.0, 144.0, 218.0, 341.0, 498.0, 766.0, 1303.0, 1857.0, 2991.0, 4596.0, 7614.0, 11941.0, 19602.0, 32285.0, 52291.0, 85690.0, 137511.0, 189870.0, 179952.0, 122308.0, 76040.0, 46355.0, 27897.0, 17194.0, 10700.0, 6607.0, 4202.0, 2504.0, 1657.0, 1151.0, 701.0, 440.0, 302.0, 210.0, 147.0, 108.0, 62.0, 48.0, 27.0, 22.0, 21.0, 3.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6435546875, -0.62200927734375, -0.6004638671875, -0.57891845703125, -0.557373046875, -0.53582763671875, -0.5142822265625, -0.49273681640625, -0.47119140625, -0.44964599609375, -0.4281005859375, -0.40655517578125, -0.385009765625, -0.36346435546875, -0.3419189453125, -0.32037353515625, -0.298828125, -0.27728271484375, -0.2557373046875, -0.23419189453125, -0.212646484375, -0.19110107421875, -0.1695556640625, -0.14801025390625, -0.12646484375, -0.10491943359375, -0.0833740234375, -0.06182861328125, -0.040283203125, -0.01873779296875, 0.0028076171875, 0.02435302734375, 0.0458984375, 0.06744384765625, 0.0889892578125, 0.11053466796875, 0.132080078125, 0.15362548828125, 0.1751708984375, 0.19671630859375, 0.21826171875, 0.23980712890625, 0.2613525390625, 0.28289794921875, 0.304443359375, 0.32598876953125, 0.3475341796875, 0.36907958984375, 0.390625, 0.41217041015625, 0.4337158203125, 0.45526123046875, 0.476806640625, 0.49835205078125, 0.5198974609375, 0.54144287109375, 0.56298828125, 0.58453369140625, 0.6060791015625, 0.62762451171875, 0.649169921875, 0.67071533203125, 0.6922607421875, 0.71380615234375, 0.7353515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 11.0, 10.0, 5.0, 5.0, 7.0, 14.0, 19.0, 20.0, 13.0, 21.0, 13.0, 22.0, 29.0, 25.0, 22.0, 34.0, 34.0, 38.0, 29.0, 32.0, 36.0, 43.0, 1058.0, 38.0, 32.0, 33.0, 27.0, 39.0, 41.0, 27.0, 27.0, 23.0, 26.0, 16.0, 28.0, 13.0, 22.0, 13.0, 11.0, 10.0, 6.0, 13.0, 12.0, 4.0, 6.0, 8.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.955078125, -3.83673095703125, -3.7183837890625, -3.60003662109375, -3.481689453125, -3.36334228515625, -3.2449951171875, -3.12664794921875, -3.00830078125, -2.88995361328125, -2.7716064453125, -2.65325927734375, -2.534912109375, -2.41656494140625, -2.2982177734375, -2.17987060546875, -2.0615234375, -1.94317626953125, -1.8248291015625, -1.70648193359375, -1.588134765625, -1.46978759765625, -1.3514404296875, -1.23309326171875, -1.11474609375, -0.99639892578125, -0.8780517578125, -0.75970458984375, -0.641357421875, -0.52301025390625, -0.4046630859375, -0.28631591796875, -0.16796875, -0.04962158203125, 0.0687255859375, 0.18707275390625, 0.305419921875, 0.42376708984375, 0.5421142578125, 0.66046142578125, 0.77880859375, 0.89715576171875, 1.0155029296875, 1.13385009765625, 1.252197265625, 1.37054443359375, 1.4888916015625, 1.60723876953125, 1.7255859375, 1.84393310546875, 1.9622802734375, 2.08062744140625, 2.198974609375, 2.31732177734375, 2.4356689453125, 2.55401611328125, 2.67236328125, 2.79071044921875, 2.9090576171875, 3.02740478515625, 3.145751953125, 3.26409912109375, 3.3824462890625, 3.50079345703125, 3.619140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 11.0, 12.0, 26.0, 26.0, 54.0, 83.0, 121.0, 236.0, 364.0, 551.0, 990.0, 1532.0, 2555.0, 4221.0, 6958.0, 11293.0, 18404.0, 29953.0, 48489.0, 77285.0, 117860.0, 162251.0, 1220772.0, 139291.0, 94775.0, 61097.0, 37769.0, 23318.0, 14570.0, 8713.0, 5330.0, 3175.0, 1972.0, 1229.0, 747.0, 390.0, 260.0, 167.0, 88.0, 63.0, 44.0, 28.0, 16.0, 18.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.5322265625, -0.515716552734375, -0.49920654296875, -0.482696533203125, -0.4661865234375, -0.449676513671875, -0.43316650390625, -0.416656494140625, -0.400146484375, -0.383636474609375, -0.36712646484375, -0.350616455078125, -0.3341064453125, -0.317596435546875, -0.30108642578125, -0.284576416015625, -0.26806640625, -0.251556396484375, -0.23504638671875, -0.218536376953125, -0.2020263671875, -0.185516357421875, -0.16900634765625, -0.152496337890625, -0.135986328125, -0.119476318359375, -0.10296630859375, -0.086456298828125, -0.0699462890625, -0.053436279296875, -0.03692626953125, -0.020416259765625, -0.00390625, 0.012603759765625, 0.02911376953125, 0.045623779296875, 0.0621337890625, 0.078643798828125, 0.09515380859375, 0.111663818359375, 0.128173828125, 0.144683837890625, 0.16119384765625, 0.177703857421875, 0.1942138671875, 0.210723876953125, 0.22723388671875, 0.243743896484375, 0.26025390625, 0.276763916015625, 0.29327392578125, 0.309783935546875, 0.3262939453125, 0.342803955078125, 0.35931396484375, 0.375823974609375, 0.392333984375, 0.408843994140625, 0.42535400390625, 0.441864013671875, 0.4583740234375, 0.474884033203125, 0.49139404296875, 0.507904052734375, 0.5244140625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 14.0, 6.0, 4.0, 12.0, 8.0, 14.0, 32.0, 30.0, 21.0, 55.0, 48.0, 71.0, 81.0, 83.0, 77.0, 78.0, 81.0, 53.0, 57.0, 45.0, 30.0, 25.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005512237548828125, -0.005355119705200195, -0.005198001861572266, -0.005040884017944336, -0.004883766174316406, -0.0047266483306884766, -0.004569530487060547, -0.004412412643432617, -0.0042552947998046875, -0.004098176956176758, -0.003941059112548828, -0.0037839412689208984, -0.0036268234252929688, -0.003469705581665039, -0.0033125877380371094, -0.0031554698944091797, -0.00299835205078125, -0.0028412342071533203, -0.0026841163635253906, -0.002526998519897461, -0.0023698806762695312, -0.0022127628326416016, -0.002055644989013672, -0.0018985271453857422, -0.0017414093017578125, -0.0015842914581298828, -0.0014271736145019531, -0.0012700557708740234, -0.0011129379272460938, -0.0009558200836181641, -0.0007987022399902344, -0.0006415843963623047, -0.000484466552734375, -0.0003273487091064453, -0.00017023086547851562, -1.3113021850585938e-05, 0.00014400482177734375, 0.00030112266540527344, 0.0004582405090332031, 0.0006153583526611328, 0.0007724761962890625, 0.0009295940399169922, 0.0010867118835449219, 0.0012438297271728516, 0.0014009475708007812, 0.001558065414428711, 0.0017151832580566406, 0.0018723011016845703, 0.0020294189453125, 0.0021865367889404297, 0.0023436546325683594, 0.002500772476196289, 0.0026578903198242188, 0.0028150081634521484, 0.002972126007080078, 0.003129243850708008, 0.0032863616943359375, 0.003443479537963867, 0.003600597381591797, 0.0037577152252197266, 0.003914833068847656, 0.004071950912475586, 0.004229068756103516, 0.004386186599731445, 0.004543304443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 9.0, 3.0, 8.0, 6.0, 5.0, 15.0, 19.0, 24.0, 35.0, 42.0, 76.0, 106.0, 164.0, 375.0, 3955.0, 1030283.0, 12376.0, 473.0, 190.0, 119.0, 77.0, 45.0, 41.0, 27.0, 16.0, 10.0, 10.0, 10.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1015625, -0.09801101684570312, -0.09445953369140625, -0.09090805053710938, -0.0873565673828125, -0.08380508422851562, -0.08025360107421875, -0.07670211791992188, -0.073150634765625, -0.06959915161132812, -0.06604766845703125, -0.062496185302734375, -0.0589447021484375, -0.055393218994140625, -0.05184173583984375, -0.048290252685546875, -0.04473876953125, -0.041187286376953125, -0.03763580322265625, -0.034084320068359375, -0.0305328369140625, -0.026981353759765625, -0.02342987060546875, -0.019878387451171875, -0.016326904296875, -0.012775421142578125, -0.00922393798828125, -0.005672454833984375, -0.0021209716796875, 0.001430511474609375, 0.00498199462890625, 0.008533477783203125, 0.0120849609375, 0.015636444091796875, 0.01918792724609375, 0.022739410400390625, 0.0262908935546875, 0.029842376708984375, 0.03339385986328125, 0.036945343017578125, 0.040496826171875, 0.044048309326171875, 0.04759979248046875, 0.051151275634765625, 0.0547027587890625, 0.058254241943359375, 0.06180572509765625, 0.06535720825195312, 0.06890869140625, 0.07246017456054688, 0.07601165771484375, 0.07956314086914062, 0.0831146240234375, 0.08666610717773438, 0.09021759033203125, 0.09376907348632812, 0.097320556640625, 0.10087203979492188, 0.10442352294921875, 0.10797500610351562, 0.1115264892578125, 0.11507797241210938, 0.11862945556640625, 0.12218093872070312, 0.125732421875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [33.0, 727.0, 244.0, 13.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015578450402244925, -0.0006737327785231173, 0.00021037948317825794, 0.001094491803087294, 0.0019786041229963303, 0.002862716093659401, 0.003746828529983759, 0.00463094050064683, 0.005515052936971188, 0.006399165373295546, 0.007283277343958616, 0.008167389780282974, 0.009051501750946045, 0.009935613721609116, 0.010819726623594761, 0.011703838594257832, 0.012587951496243477, 0.013472063466906548, 0.014356176368892193, 0.015240288339555264, 0.01612440124154091, 0.01700851321220398, 0.01789262518286705, 0.01877673715353012, 0.01966084912419319, 0.020544961094856262, 0.021429073065519333, 0.022313185036182404, 0.023197298869490623, 0.024081410840153694, 0.024965522810816765, 0.025849634781479836, 0.026733746752142906, 0.027617858722805977, 0.028501970693469048, 0.029386084526777267, 0.030270196497440338, 0.03115430846810341, 0.03203842043876648, 0.03292253240942955, 0.03380664438009262, 0.03469075635075569, 0.03557486832141876, 0.03645898029208183, 0.037343092262744904, 0.038227204233407974, 0.039111316204071045, 0.039995431900024414, 0.040879543870687485, 0.041763655841350555, 0.042647767812013626, 0.0435318797826767, 0.04441599175333977, 0.04530010372400284, 0.04618421941995621, 0.04706832766532898, 0.04795243963599205, 0.04883655160665512, 0.04972066357731819, 0.05060477554798126, 0.05148888751864433, 0.052372999489307404, 0.05325711518526077, 0.054141223430633545, 0.055025339126586914]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 6.0, 10.0, 13.0, 25.0, 27.0, 25.0, 36.0, 31.0, 44.0, 32.0, 38.0, 64.0, 59.0, 47.0, 48.0, 59.0, 58.0, 55.0, 45.0, 44.0, 39.0, 32.0, 24.0, 24.0, 20.0, 21.0, 19.0, 21.0, 15.0, 7.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031934380531311035, -0.0031006978824734688, -0.003007957711815834, -0.0029152175411581993, -0.0028224773705005646, -0.00272973719984293, -0.002636997029185295, -0.0025442568585276604, -0.0024515166878700256, -0.002358776517212391, -0.002266036346554756, -0.0021732961758971214, -0.0020805560052394867, -0.001987815834581852, -0.0018950756639242172, -0.0018023354932665825, -0.0017095953226089478, -0.001616855151951313, -0.0015241149812936783, -0.0014313748106360435, -0.0013386346399784088, -0.001245894469320774, -0.0011531542986631393, -0.0010604141280055046, -0.0009676739573478699, -0.0008749337866902351, -0.0007821936160326004, -0.0006894534453749657, -0.0005967132747173309, -0.0005039731040596962, -0.00041123293340206146, -0.00031849276274442673, -0.000225752592086792, -0.00013301242142915726, -4.027225077152252e-05, 5.246791988611221e-05, 0.00014520809054374695, 0.00023794826120138168, 0.0003306884318590164, 0.00042342860251665115, 0.0005161687731742859, 0.0006089089438319206, 0.0007016491144895554, 0.0007943892851471901, 0.0008871294558048248, 0.0009798696264624596, 0.0010726097971200943, 0.001165349967777729, 0.0012580901384353638, 0.0013508303090929985, 0.0014435704797506332, 0.001536310650408268, 0.0016290508210659027, 0.0017217909917235374, 0.0018145311623811722, 0.001907271333038807, 0.0020000115036964417, 0.0020927516743540764, 0.002185491845011711, 0.002278232015669346, 0.0023709721863269806, 0.0024637123569846153, 0.00255645252764225, 0.002649192698299885, 0.0027419328689575195]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 13.0, 11.0, 11.0, 11.0, 17.0, 16.0, 24.0, 30.0, 21.0, 20.0, 34.0, 27.0, 34.0, 51.0, 33.0, 48.0, 47.0, 43.0, 44.0, 47.0, 32.0, 34.0, 42.0, 27.0, 30.0, 35.0, 32.0, 23.0, 16.0, 21.0, 20.0, 21.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6124267578125, -5.412353515625, -5.2122802734375, -5.01220703125, -4.8121337890625, -4.612060546875, -4.4119873046875, -4.2119140625, -4.0118408203125, -3.811767578125, -3.6116943359375, -3.41162109375, -3.2115478515625, -3.011474609375, -2.8114013671875, -2.611328125, -2.4112548828125, -2.211181640625, -2.0111083984375, -1.81103515625, -1.6109619140625, -1.410888671875, -1.2108154296875, -1.0107421875, -0.8106689453125, -0.610595703125, -0.4105224609375, -0.21044921875, -0.0103759765625, 0.189697265625, 0.3897705078125, 0.58984375, 0.7899169921875, 0.989990234375, 1.1900634765625, 1.39013671875, 1.5902099609375, 1.790283203125, 1.9903564453125, 2.1904296875, 2.3905029296875, 2.590576171875, 2.7906494140625, 2.99072265625, 3.1907958984375, 3.390869140625, 3.5909423828125, 3.791015625, 3.9910888671875, 4.191162109375, 4.3912353515625, 4.59130859375, 4.7913818359375, 4.991455078125, 5.1915283203125, 5.3916015625, 5.5916748046875, 5.791748046875, 5.9918212890625, 6.19189453125, 6.3919677734375, 6.592041015625, 6.7921142578125, 6.9921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 7.0, 16.0, 15.0, 21.0, 24.0, 44.0, 39.0, 73.0, 128.0, 152.0, 252.0, 432.0, 787.0, 1481.0, 3160.0, 7529.0, 20845.0, 80455.0, 371038.0, 431717.0, 91772.0, 23355.0, 8045.0, 3340.0, 1693.0, 842.0, 446.0, 282.0, 168.0, 105.0, 68.0, 51.0, 37.0, 36.0, 22.0, 12.0, 16.0, 9.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.4124755859375, -5.219482421875, -5.0264892578125, -4.83349609375, -4.6405029296875, -4.447509765625, -4.2545166015625, -4.0615234375, -3.8685302734375, -3.675537109375, -3.4825439453125, -3.28955078125, -3.0965576171875, -2.903564453125, -2.7105712890625, -2.517578125, -2.3245849609375, -2.131591796875, -1.9385986328125, -1.74560546875, -1.5526123046875, -1.359619140625, -1.1666259765625, -0.9736328125, -0.7806396484375, -0.587646484375, -0.3946533203125, -0.20166015625, -0.0086669921875, 0.184326171875, 0.3773193359375, 0.5703125, 0.7633056640625, 0.956298828125, 1.1492919921875, 1.34228515625, 1.5352783203125, 1.728271484375, 1.9212646484375, 2.1142578125, 2.3072509765625, 2.500244140625, 2.6932373046875, 2.88623046875, 3.0792236328125, 3.272216796875, 3.4652099609375, 3.658203125, 3.8511962890625, 4.044189453125, 4.2371826171875, 4.43017578125, 4.6231689453125, 4.816162109375, 5.0091552734375, 5.2021484375, 5.3951416015625, 5.588134765625, 5.7811279296875, 5.97412109375, 6.1671142578125, 6.360107421875, 6.5531005859375, 6.74609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 10.0, 8.0, 9.0, 11.0, 20.0, 17.0, 14.0, 19.0, 17.0, 31.0, 28.0, 29.0, 26.0, 38.0, 32.0, 52.0, 47.0, 89.0, 347.0, 1567.0, 139.0, 69.0, 41.0, 38.0, 35.0, 33.0, 30.0, 29.0, 40.0, 18.0, 22.0, 25.0, 22.0, 6.0, 10.0, 9.0, 5.0, 5.0, 11.0, 7.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-19.421875, -18.818359375, -18.21484375, -17.611328125, -17.0078125, -16.404296875, -15.80078125, -15.197265625, -14.59375, -13.990234375, -13.38671875, -12.783203125, -12.1796875, -11.576171875, -10.97265625, -10.369140625, -9.765625, -9.162109375, -8.55859375, -7.955078125, -7.3515625, -6.748046875, -6.14453125, -5.541015625, -4.9375, -4.333984375, -3.73046875, -3.126953125, -2.5234375, -1.919921875, -1.31640625, -0.712890625, -0.109375, 0.494140625, 1.09765625, 1.701171875, 2.3046875, 2.908203125, 3.51171875, 4.115234375, 4.71875, 5.322265625, 5.92578125, 6.529296875, 7.1328125, 7.736328125, 8.33984375, 8.943359375, 9.546875, 10.150390625, 10.75390625, 11.357421875, 11.9609375, 12.564453125, 13.16796875, 13.771484375, 14.375, 14.978515625, 15.58203125, 16.185546875, 16.7890625, 17.392578125, 17.99609375, 18.599609375, 19.203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 5.0, 11.0, 16.0, 17.0, 19.0, 22.0, 36.0, 68.0, 105.0, 166.0, 266.0, 504.0, 1878.0, 2726368.0, 413560.0, 1536.0, 440.0, 246.0, 163.0, 87.0, 54.0, 41.0, 31.0, 21.0, 15.0, 13.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.25, -73.7041015625, -71.158203125, -68.6123046875, -66.06640625, -63.5205078125, -60.974609375, -58.4287109375, -55.8828125, -53.3369140625, -50.791015625, -48.2451171875, -45.69921875, -43.1533203125, -40.607421875, -38.0615234375, -35.515625, -32.9697265625, -30.423828125, -27.8779296875, -25.33203125, -22.7861328125, -20.240234375, -17.6943359375, -15.1484375, -12.6025390625, -10.056640625, -7.5107421875, -4.96484375, -2.4189453125, 0.126953125, 2.6728515625, 5.21875, 7.7646484375, 10.310546875, 12.8564453125, 15.40234375, 17.9482421875, 20.494140625, 23.0400390625, 25.5859375, 28.1318359375, 30.677734375, 33.2236328125, 35.76953125, 38.3154296875, 40.861328125, 43.4072265625, 45.953125, 48.4990234375, 51.044921875, 53.5908203125, 56.13671875, 58.6826171875, 61.228515625, 63.7744140625, 66.3203125, 68.8662109375, 71.412109375, 73.9580078125, 76.50390625, 79.0498046875, 81.595703125, 84.1416015625, 86.6875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 26.0, 163.0, 310.0, 317.0, 137.0, 41.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.58265686035156, -36.074092864990234, -34.56553268432617, -33.056968688964844, -31.54840850830078, -30.039846420288086, -28.53128433227539, -27.022720336914062, -25.51416015625, -24.005598068237305, -22.49703598022461, -20.988473892211914, -19.47991180419922, -17.971349716186523, -16.462787628173828, -14.954224586486816, -13.445661544799805, -11.93709945678711, -10.428537368774414, -8.919975280761719, -7.411412715911865, -5.90285062789917, -4.394288063049316, -2.885725975036621, -1.3771638870239258, 0.13139832019805908, 1.639960527420044, 3.1485228538513184, 4.657084941864014, 6.165647029876709, 7.6742095947265625, 9.182771682739258, 10.691333770751953, 12.199895858764648, 13.708457946777344, 15.217020034790039, 16.725582122802734, 18.23414421081543, 19.742706298828125, 21.251270294189453, 22.759830474853516, 24.26839256286621, 25.776954650878906, 27.2855167388916, 28.794078826904297, 30.302640914916992, 31.811203002929688, 33.319766998291016, 34.828330993652344, 36.33689498901367, 37.845455169677734, 39.35401916503906, 40.862579345703125, 42.37114334106445, 43.879703521728516, 45.388267517089844, 46.896827697753906, 48.405391693115234, 49.9139518737793, 51.422515869140625, 52.93107604980469, 54.439640045166016, 55.94820022583008, 57.456764221191406, 58.96532440185547]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 20.0, 15.0, 16.0, 16.0, 27.0, 28.0, 26.0, 44.0, 27.0, 38.0, 38.0, 46.0, 43.0, 44.0, 36.0, 53.0, 49.0, 40.0, 39.0, 43.0, 35.0, 26.0, 30.0, 24.0, 18.0, 24.0, 19.0, 18.0, 11.0, 12.0, 16.0, 6.0, 3.0, 6.0, 4.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.525245666503906, -54.71100616455078, -52.896766662597656, -51.08252716064453, -49.268287658691406, -47.45404815673828, -45.63980484008789, -43.825565338134766, -42.01132583618164, -40.197086334228516, -38.38284683227539, -36.568607330322266, -34.754364013671875, -32.94012451171875, -31.125885009765625, -29.3116455078125, -27.497406005859375, -25.68316650390625, -23.868927001953125, -22.054685592651367, -20.240446090698242, -18.426206588745117, -16.61196517944336, -14.797725677490234, -12.98348617553711, -11.169246673583984, -9.355006217956543, -7.54076623916626, -5.726526260375977, -3.9122867584228516, -2.09804630279541, -0.28380584716796875, 1.5304336547851562, 3.3446736335754395, 5.158913612365723, 6.973153591156006, 8.787393569946289, 10.601633071899414, 12.415873527526855, 14.230113983154297, 16.044353485107422, 17.858592987060547, 19.672832489013672, 21.48707389831543, 23.301313400268555, 25.11555290222168, 26.929794311523438, 28.744033813476562, 30.558273315429688, 32.37251281738281, 34.18675231933594, 36.00099182128906, 37.81523132324219, 39.62947082519531, 41.4437141418457, 43.25795364379883, 45.07219314575195, 46.88643264770508, 48.7006721496582, 50.51491165161133, 52.32915496826172, 54.143394470214844, 55.95763397216797, 57.771873474121094, 59.58611297607422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 9.0, 9.0, 11.0, 9.0, 20.0, 8.0, 14.0, 19.0, 25.0, 36.0, 23.0, 31.0, 32.0, 30.0, 43.0, 31.0, 61.0, 41.0, 41.0, 45.0, 52.0, 30.0, 39.0, 36.0, 33.0, 40.0, 25.0, 31.0, 28.0, 20.0, 24.0, 13.0, 17.0, 16.0, 13.0, 10.0, 5.0, 1.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0859375, -5.8760986328125, -5.666259765625, -5.4564208984375, -5.24658203125, -5.0367431640625, -4.826904296875, -4.6170654296875, -4.4072265625, -4.1973876953125, -3.987548828125, -3.7777099609375, -3.56787109375, -3.3580322265625, -3.148193359375, -2.9383544921875, -2.728515625, -2.5186767578125, -2.308837890625, -2.0989990234375, -1.88916015625, -1.6793212890625, -1.469482421875, -1.2596435546875, -1.0498046875, -0.8399658203125, -0.630126953125, -0.4202880859375, -0.21044921875, -0.0006103515625, 0.209228515625, 0.4190673828125, 0.62890625, 0.8387451171875, 1.048583984375, 1.2584228515625, 1.46826171875, 1.6781005859375, 1.887939453125, 2.0977783203125, 2.3076171875, 2.5174560546875, 2.727294921875, 2.9371337890625, 3.14697265625, 3.3568115234375, 3.566650390625, 3.7764892578125, 3.986328125, 4.1961669921875, 4.406005859375, 4.6158447265625, 4.82568359375, 5.0355224609375, 5.245361328125, 5.4552001953125, 5.6650390625, 5.8748779296875, 6.084716796875, 6.2945556640625, 6.50439453125, 6.7142333984375, 6.924072265625, 7.1339111328125, 7.34375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 14.0, 5.0, 10.0, 14.0, 17.0, 28.0, 22.0, 26.0, 39.0, 42.0, 48.0, 59.0, 79.0, 111.0, 175.0, 280.0, 718.0, 2210.0, 11054.0, 103648.0, 1550228.0, 2300031.0, 203154.0, 17149.0, 3107.0, 904.0, 361.0, 180.0, 129.0, 97.0, 81.0, 50.0, 40.0, 34.0, 27.0, 32.0, 19.0, 10.0, 11.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8125, -13.28369140625, -12.7548828125, -12.22607421875, -11.697265625, -11.16845703125, -10.6396484375, -10.11083984375, -9.58203125, -9.05322265625, -8.5244140625, -7.99560546875, -7.466796875, -6.93798828125, -6.4091796875, -5.88037109375, -5.3515625, -4.82275390625, -4.2939453125, -3.76513671875, -3.236328125, -2.70751953125, -2.1787109375, -1.64990234375, -1.12109375, -0.59228515625, -0.0634765625, 0.46533203125, 0.994140625, 1.52294921875, 2.0517578125, 2.58056640625, 3.109375, 3.63818359375, 4.1669921875, 4.69580078125, 5.224609375, 5.75341796875, 6.2822265625, 6.81103515625, 7.33984375, 7.86865234375, 8.3974609375, 8.92626953125, 9.455078125, 9.98388671875, 10.5126953125, 11.04150390625, 11.5703125, 12.09912109375, 12.6279296875, 13.15673828125, 13.685546875, 14.21435546875, 14.7431640625, 15.27197265625, 15.80078125, 16.32958984375, 16.8583984375, 17.38720703125, 17.916015625, 18.44482421875, 18.9736328125, 19.50244140625, 20.03125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 13.0, 12.0, 12.0, 19.0, 26.0, 51.0, 52.0, 56.0, 88.0, 98.0, 136.0, 166.0, 208.0, 292.0, 390.0, 456.0, 442.0, 378.0, 290.0, 225.0, 160.0, 128.0, 98.0, 62.0, 60.0, 34.0, 28.0, 33.0, 20.0, 10.0, 10.0, 5.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.086181640625, -12.71142578125, -12.336669921875, -11.9619140625, -11.587158203125, -11.21240234375, -10.837646484375, -10.462890625, -10.088134765625, -9.71337890625, -9.338623046875, -8.9638671875, -8.589111328125, -8.21435546875, -7.839599609375, -7.46484375, -7.090087890625, -6.71533203125, -6.340576171875, -5.9658203125, -5.591064453125, -5.21630859375, -4.841552734375, -4.466796875, -4.092041015625, -3.71728515625, -3.342529296875, -2.9677734375, -2.593017578125, -2.21826171875, -1.843505859375, -1.46875, -1.093994140625, -0.71923828125, -0.344482421875, 0.0302734375, 0.405029296875, 0.77978515625, 1.154541015625, 1.529296875, 1.904052734375, 2.27880859375, 2.653564453125, 3.0283203125, 3.403076171875, 3.77783203125, 4.152587890625, 4.52734375, 4.902099609375, 5.27685546875, 5.651611328125, 6.0263671875, 6.401123046875, 6.77587890625, 7.150634765625, 7.525390625, 7.900146484375, 8.27490234375, 8.649658203125, 9.0244140625, 9.399169921875, 9.77392578125, 10.148681640625, 10.5234375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 13.0, 18.0, 31.0, 39.0, 32.0, 46.0, 71.0, 97.0, 102.0, 143.0, 160.0, 255.0, 303.0, 543.0, 2324.0, 153659.0, 3984583.0, 48541.0, 1483.0, 479.0, 292.0, 209.0, 198.0, 135.0, 116.0, 96.0, 64.0, 54.0, 52.0, 34.0, 25.0, 19.0, 10.0, 16.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.71875, -43.08642578125, -41.4541015625, -39.82177734375, -38.189453125, -36.55712890625, -34.9248046875, -33.29248046875, -31.66015625, -30.02783203125, -28.3955078125, -26.76318359375, -25.130859375, -23.49853515625, -21.8662109375, -20.23388671875, -18.6015625, -16.96923828125, -15.3369140625, -13.70458984375, -12.072265625, -10.43994140625, -8.8076171875, -7.17529296875, -5.54296875, -3.91064453125, -2.2783203125, -0.64599609375, 0.986328125, 2.61865234375, 4.2509765625, 5.88330078125, 7.515625, 9.14794921875, 10.7802734375, 12.41259765625, 14.044921875, 15.67724609375, 17.3095703125, 18.94189453125, 20.57421875, 22.20654296875, 23.8388671875, 25.47119140625, 27.103515625, 28.73583984375, 30.3681640625, 32.00048828125, 33.6328125, 35.26513671875, 36.8974609375, 38.52978515625, 40.162109375, 41.79443359375, 43.4267578125, 45.05908203125, 46.69140625, 48.32373046875, 49.9560546875, 51.58837890625, 53.220703125, 54.85302734375, 56.4853515625, 58.11767578125, 59.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 16.0, 127.0, 353.0, 378.0, 117.0, 20.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.40177154541016, -113.42817687988281, -107.45457458496094, -101.4809799194336, -95.50738525390625, -89.53378295898438, -83.56018829345703, -77.58659362792969, -71.61299133300781, -65.63939666748047, -59.66579818725586, -53.69219970703125, -47.718605041503906, -41.7450065612793, -35.77140808105469, -29.797813415527344, -23.82421875, -17.850622177124023, -11.87702465057373, -5.9034271240234375, 0.07016944885253906, 6.043766021728516, 12.017364501953125, 17.99095916748047, 23.964557647705078, 29.938154220581055, 35.91175079345703, 41.88534927368164, 47.85894775390625, 53.832542419433594, 59.8061408996582, 65.77973937988281, 71.75334167480469, 77.72693634033203, 83.7005386352539, 89.67413330078125, 95.6477279663086, 101.62132263183594, 107.59492492675781, 113.56851959228516, 119.5421142578125, 125.51570892333984, 131.4893035888672, 137.46290588378906, 143.43650817871094, 149.41009521484375, 155.38369750976562, 161.3572998046875, 167.33090209960938, 173.30450439453125, 179.27809143066406, 185.25169372558594, 191.2252960205078, 197.19888305664062, 203.1724853515625, 209.14608764648438, 215.1196746826172, 221.09327697753906, 227.06686401367188, 233.04046630859375, 239.01406860351562, 244.98765563964844, 250.9612579345703, 256.9348449707031, 262.908447265625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 13.0, 14.0, 15.0, 11.0, 19.0, 26.0, 27.0, 28.0, 24.0, 38.0, 32.0, 38.0, 51.0, 50.0, 42.0, 45.0, 42.0, 54.0, 42.0, 42.0, 35.0, 31.0, 40.0, 34.0, 30.0, 28.0, 21.0, 24.0, 16.0, 18.0, 7.0, 10.0, 13.0, 4.0, 5.0, 3.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.3616943359375, -47.98292541503906, -46.60416030883789, -45.22539138793945, -43.84662628173828, -42.467857360839844, -41.089088439941406, -39.71031951904297, -38.3315544128418, -36.95278549194336, -35.57402038574219, -34.19525146484375, -32.81648254394531, -31.43771743774414, -30.058948516845703, -28.6801815032959, -27.301414489746094, -25.92264747619629, -24.543880462646484, -23.165111541748047, -21.786344528198242, -20.407577514648438, -19.02880859375, -17.650041580200195, -16.27127456665039, -14.892507553100586, -13.513739585876465, -12.134971618652344, -10.756204605102539, -9.377437591552734, -7.998669624328613, -6.619901657104492, -5.2411346435546875, -3.8623671531677246, -2.4835996627807617, -1.1048321723937988, 0.27393531799316406, 1.652702808380127, 3.03147029876709, 4.410238265991211, 5.789005279541016, 7.1677727699279785, 8.546540260314941, 9.925308227539062, 11.304075241088867, 12.682842254638672, 14.061610221862793, 15.440378189086914, 16.81914520263672, 18.197912216186523, 19.576679229736328, 20.955448150634766, 22.33421516418457, 23.712982177734375, 25.091751098632812, 26.470518112182617, 27.849285125732422, 29.228052139282227, 30.60681915283203, 31.98558807373047, 33.364356994628906, 34.74312210083008, 36.121891021728516, 37.50065612792969, 38.879425048828125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 44.0, 49.0, 37.0, 29.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 4.0, 8.0, 7.0, 9.0, 17.0, 13.0, 41.0, 57.0, 58.0, 101.0, 155.0, 226.0, 282.0, 479.0, 760.0, 1077.0, 1703.0, 2625.0, 4058.0, 6268.0, 10183.0, 16396.0, 26203.0, 42071.0, 68373.0, 106964.0, 154932.0, 181413.0, 149102.0, 101952.0, 64911.0, 40696.0, 25227.0, 15575.0, 9709.0, 5865.0, 3936.0, 2393.0, 1551.0, 1005.0, 681.0, 501.0, 311.0, 211.0, 136.0, 84.0, 79.0, 45.0, 33.0, 27.0, 20.0, 10.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.63916015625, -0.61883544921875, -0.5985107421875, -0.57818603515625, -0.557861328125, -0.53753662109375, -0.5172119140625, -0.49688720703125, -0.4765625, -0.45623779296875, -0.4359130859375, -0.41558837890625, -0.395263671875, -0.37493896484375, -0.3546142578125, -0.33428955078125, -0.31396484375, -0.29364013671875, -0.2733154296875, -0.25299072265625, -0.232666015625, -0.21234130859375, -0.1920166015625, -0.17169189453125, -0.1513671875, -0.13104248046875, -0.1107177734375, -0.09039306640625, -0.070068359375, -0.04974365234375, -0.0294189453125, -0.00909423828125, 0.01123046875, 0.03155517578125, 0.0518798828125, 0.07220458984375, 0.092529296875, 0.11285400390625, 0.1331787109375, 0.15350341796875, 0.173828125, 0.19415283203125, 0.2144775390625, 0.23480224609375, 0.255126953125, 0.27545166015625, 0.2957763671875, 0.31610107421875, 0.33642578125, 0.35675048828125, 0.3770751953125, 0.39739990234375, 0.417724609375, 0.43804931640625, 0.4583740234375, 0.47869873046875, 0.4990234375, 0.51934814453125, 0.5396728515625, 0.55999755859375, 0.580322265625, 0.60064697265625, 0.6209716796875, 0.64129638671875, 0.66162109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 3.0, 14.0, 19.0, 12.0, 12.0, 14.0, 24.0, 27.0, 29.0, 24.0, 32.0, 42.0, 40.0, 37.0, 60.0, 43.0, 47.0, 1067.0, 52.0, 47.0, 35.0, 42.0, 40.0, 45.0, 41.0, 33.0, 21.0, 14.0, 25.0, 20.0, 16.0, 8.0, 2.0, 7.0, 5.0, 3.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.0546875, -4.91143798828125, -4.7681884765625, -4.62493896484375, -4.481689453125, -4.33843994140625, -4.1951904296875, -4.05194091796875, -3.90869140625, -3.76544189453125, -3.6221923828125, -3.47894287109375, -3.335693359375, -3.19244384765625, -3.0491943359375, -2.90594482421875, -2.7626953125, -2.61944580078125, -2.4761962890625, -2.33294677734375, -2.189697265625, -2.04644775390625, -1.9031982421875, -1.75994873046875, -1.61669921875, -1.47344970703125, -1.3302001953125, -1.18695068359375, -1.043701171875, -0.90045166015625, -0.7572021484375, -0.61395263671875, -0.470703125, -0.32745361328125, -0.1842041015625, -0.04095458984375, 0.102294921875, 0.24554443359375, 0.3887939453125, 0.53204345703125, 0.67529296875, 0.81854248046875, 0.9617919921875, 1.10504150390625, 1.248291015625, 1.39154052734375, 1.5347900390625, 1.67803955078125, 1.8212890625, 1.96453857421875, 2.1077880859375, 2.25103759765625, 2.394287109375, 2.53753662109375, 2.6807861328125, 2.82403564453125, 2.96728515625, 3.11053466796875, 3.2537841796875, 3.39703369140625, 3.540283203125, 3.68353271484375, 3.8267822265625, 3.97003173828125, 4.11328125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 10.0, 15.0, 19.0, 59.0, 74.0, 135.0, 184.0, 333.0, 512.0, 909.0, 1331.0, 2290.0, 3638.0, 5870.0, 9420.0, 15302.0, 24481.0, 38759.0, 62394.0, 95587.0, 135797.0, 1212029.0, 157605.0, 117736.0, 78735.0, 50538.0, 31765.0, 19473.0, 12232.0, 7448.0, 4716.0, 2938.0, 1830.0, 1152.0, 681.0, 444.0, 249.0, 170.0, 97.0, 60.0, 37.0, 23.0, 15.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4797706604003906, -0.46417999267578125, -0.4485893249511719, -0.4329986572265625, -0.4174079895019531, -0.40181732177734375, -0.3862266540527344, -0.370635986328125, -0.3550453186035156, -0.33945465087890625, -0.3238639831542969, -0.3082733154296875, -0.2926826477050781, -0.27709197998046875, -0.2615013122558594, -0.24591064453125, -0.23031997680664062, -0.21472930908203125, -0.19913864135742188, -0.1835479736328125, -0.16795730590820312, -0.15236663818359375, -0.13677597045898438, -0.121185302734375, -0.10559463500976562, -0.09000396728515625, -0.07441329956054688, -0.0588226318359375, -0.043231964111328125, -0.02764129638671875, -0.012050628662109375, 0.0035400390625, 0.019130706787109375, 0.03472137451171875, 0.050312042236328125, 0.0659027099609375, 0.08149337768554688, 0.09708404541015625, 0.11267471313476562, 0.128265380859375, 0.14385604858398438, 0.15944671630859375, 0.17503738403320312, 0.1906280517578125, 0.20621871948242188, 0.22180938720703125, 0.23740005493164062, 0.25299072265625, 0.2685813903808594, 0.28417205810546875, 0.2997627258300781, 0.3153533935546875, 0.3309440612792969, 0.34653472900390625, 0.3621253967285156, 0.377716064453125, 0.3933067321777344, 0.40889739990234375, 0.4244880676269531, 0.4400787353515625, 0.4556694030761719, 0.47126007080078125, 0.4868507385253906, 0.50244140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 6.0, 2.0, 13.0, 13.0, 19.0, 21.0, 19.0, 20.0, 34.0, 48.0, 64.0, 69.0, 85.0, 78.0, 95.0, 67.0, 83.0, 40.0, 47.0, 38.0, 20.0, 23.0, 16.0, 11.0, 13.0, 11.0, 4.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004192352294921875, -0.0040648579597473145, -0.003937363624572754, -0.0038098692893981934, -0.003682374954223633, -0.0035548806190490723, -0.0034273862838745117, -0.003299891948699951, -0.0031723976135253906, -0.00304490327835083, -0.0029174089431762695, -0.002789914608001709, -0.0026624202728271484, -0.002534925937652588, -0.0024074316024780273, -0.002279937267303467, -0.0021524429321289062, -0.0020249485969543457, -0.0018974542617797852, -0.0017699599266052246, -0.001642465591430664, -0.0015149712562561035, -0.001387476921081543, -0.0012599825859069824, -0.0011324882507324219, -0.0010049939155578613, -0.0008774995803833008, -0.0007500052452087402, -0.0006225109100341797, -0.0004950165748596191, -0.0003675222396850586, -0.00024002790451049805, -0.0001125335693359375, 1.4960765838623047e-05, 0.0001424551010131836, 0.00026994943618774414, 0.0003974437713623047, 0.0005249381065368652, 0.0006524324417114258, 0.0007799267768859863, 0.0009074211120605469, 0.0010349154472351074, 0.001162409782409668, 0.0012899041175842285, 0.001417398452758789, 0.0015448927879333496, 0.0016723871231079102, 0.0017998814582824707, 0.0019273757934570312, 0.002054870128631592, 0.0021823644638061523, 0.002309858798980713, 0.0024373531341552734, 0.002564847469329834, 0.0026923418045043945, 0.002819836139678955, 0.0029473304748535156, 0.003074824810028076, 0.0032023191452026367, 0.0033298134803771973, 0.003457307815551758, 0.0035848021507263184, 0.003712296485900879, 0.0038397908210754395, 0.00396728515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 0.0, 5.0, 8.0, 10.0, 6.0, 11.0, 11.0, 17.0, 21.0, 27.0, 32.0, 45.0, 63.0, 90.0, 135.0, 251.0, 993.0, 70357.0, 972484.0, 3038.0, 363.0, 203.0, 121.0, 76.0, 41.0, 32.0, 26.0, 24.0, 12.0, 14.0, 15.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083740234375, -0.08087348937988281, -0.07800674438476562, -0.07513999938964844, -0.07227325439453125, -0.06940650939941406, -0.06653976440429688, -0.06367301940917969, -0.0608062744140625, -0.05793952941894531, -0.055072784423828125, -0.05220603942871094, -0.04933929443359375, -0.04647254943847656, -0.043605804443359375, -0.04073905944824219, -0.037872314453125, -0.03500556945800781, -0.032138824462890625, -0.029272079467773438, -0.02640533447265625, -0.023538589477539062, -0.020671844482421875, -0.017805099487304688, -0.0149383544921875, -0.012071609497070312, -0.009204864501953125, -0.0063381195068359375, -0.00347137451171875, -0.0006046295166015625, 0.002262115478515625, 0.0051288604736328125, 0.00799560546875, 0.010862350463867188, 0.013729095458984375, 0.016595840454101562, 0.01946258544921875, 0.022329330444335938, 0.025196075439453125, 0.028062820434570312, 0.0309295654296875, 0.03379631042480469, 0.036663055419921875, 0.03952980041503906, 0.04239654541015625, 0.04526329040527344, 0.048130035400390625, 0.05099678039550781, 0.053863525390625, 0.05673027038574219, 0.059597015380859375, 0.06246376037597656, 0.06533050537109375, 0.06819725036621094, 0.07106399536132812, 0.07393074035644531, 0.0767974853515625, 0.07966423034667969, 0.08253097534179688, 0.08539772033691406, 0.08826446533203125, 0.09113121032714844, 0.09399795532226562, 0.09686470031738281, 0.0997314453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 10.0, 15.0, 29.0, 61.0, 104.0, 203.0, 230.0, 169.0, 85.0, 50.0, 28.0, 15.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018103704787790775, -0.0016513746231794357, -0.0014923788839951158, -0.0013333831448107958, -0.001174387289211154, -0.0010153914336115122, -0.0008563956944271922, -0.0006973999552428722, -0.0005384040996432304, -0.00037940830225124955, -0.00022041250485926867, -6.141670746728778e-05, 9.757908992469311e-05, 0.000256574887316674, 0.0004155706847086549, 0.0005745664238929749, 0.0007335622794926167, 0.0008925580768845975, 0.0010515538742765784, 0.0012105496134608984, 0.0013695454690605402, 0.001528541324660182, 0.001687537063844502, 0.001846532803028822, 0.0020055286586284637, 0.0021645245142281055, 0.0023235203698277473, 0.0024825159925967455, 0.0026415118481963873, 0.002800507703796029, 0.0029595033265650272, 0.003118499182164669, 0.003277495503425598, 0.00343649135902524, 0.0035954872146248817, 0.00375448283739388, 0.003913478925824165, 0.00407247431576252, 0.004231470171362162, 0.0043904660269618034, 0.004549461882561445, 0.004708457738161087, 0.004867453593760729, 0.005026449449360371, 0.005185444839298725, 0.005344440694898367, 0.005503436550498009, 0.0056624324060976505, 0.005821428261697292, 0.005980424117296934, 0.006139419972896576, 0.006298415828496218, 0.0064574116840958595, 0.006616407074034214, 0.006775402929633856, 0.006934398785233498, 0.007093394640833139, 0.007252390496432781, 0.007411386352032423, 0.007570382207632065, 0.007729377597570419, 0.007888373918831348, 0.008047369308769703, 0.008206365630030632, 0.008365361019968987]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 8.0, 11.0, 12.0, 12.0, 13.0, 22.0, 35.0, 36.0, 24.0, 38.0, 42.0, 23.0, 43.0, 46.0, 43.0, 35.0, 41.0, 40.0, 29.0, 46.0, 31.0, 37.0, 34.0, 35.0, 30.0, 30.0, 34.0, 28.0, 15.0, 19.0, 9.0, 19.0, 14.0, 9.0, 4.0, 9.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0019698143005371094, -0.0019105495885014534, -0.0018512848764657974, -0.0017920201644301414, -0.0017327554523944855, -0.0016734907403588295, -0.0016142260283231735, -0.0015549613162875175, -0.0014956966042518616, -0.0014364318922162056, -0.0013771671801805496, -0.0013179024681448936, -0.0012586377561092377, -0.0011993730440735817, -0.0011401083320379257, -0.0010808436200022697, -0.0010215789079666138, -0.0009623141959309578, -0.0009030494838953018, -0.0008437847718596458, -0.0007845200598239899, -0.0007252553477883339, -0.0006659906357526779, -0.0006067259237170219, -0.000547461211681366, -0.00048819649964571, -0.000428931787610054, -0.00036966707557439804, -0.00031040236353874207, -0.0002511376515030861, -0.00019187293946743011, -0.00013260822743177414, -7.334351539611816e-05, -1.4078803360462189e-05, 4.518590867519379e-05, 0.00010445062071084976, 0.00016371533274650574, 0.0002229800447821617, 0.0002822447568178177, 0.00034150946885347366, 0.00040077418088912964, 0.0004600388929247856, 0.0005193036049604416, 0.0005785683169960976, 0.0006378330290317535, 0.0006970977410674095, 0.0007563624531030655, 0.0008156271651387215, 0.0008748918771743774, 0.0009341565892100334, 0.0009934213012456894, 0.0010526860132813454, 0.0011119507253170013, 0.0011712154373526573, 0.0012304801493883133, 0.0012897448614239693, 0.0013490095734596252, 0.0014082742854952812, 0.0014675389975309372, 0.0015268037095665932, 0.0015860684216022491, 0.0016453331336379051, 0.001704597845673561, 0.001763862557709217, 0.001823127269744873]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 6.0, 12.0, 9.0, 11.0, 20.0, 16.0, 15.0, 16.0, 27.0, 28.0, 32.0, 34.0, 36.0, 40.0, 39.0, 33.0, 39.0, 46.0, 45.0, 48.0, 38.0, 28.0, 41.0, 29.0, 30.0, 34.0, 47.0, 24.0, 24.0, 11.0, 13.0, 26.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5234375, -5.3228759765625, -5.122314453125, -4.9217529296875, -4.72119140625, -4.5206298828125, -4.320068359375, -4.1195068359375, -3.9189453125, -3.7183837890625, -3.517822265625, -3.3172607421875, -3.11669921875, -2.9161376953125, -2.715576171875, -2.5150146484375, -2.314453125, -2.1138916015625, -1.913330078125, -1.7127685546875, -1.51220703125, -1.3116455078125, -1.111083984375, -0.9105224609375, -0.7099609375, -0.5093994140625, -0.308837890625, -0.1082763671875, 0.09228515625, 0.2928466796875, 0.493408203125, 0.6939697265625, 0.89453125, 1.0950927734375, 1.295654296875, 1.4962158203125, 1.69677734375, 1.8973388671875, 2.097900390625, 2.2984619140625, 2.4990234375, 2.6995849609375, 2.900146484375, 3.1007080078125, 3.30126953125, 3.5018310546875, 3.702392578125, 3.9029541015625, 4.103515625, 4.3040771484375, 4.504638671875, 4.7052001953125, 4.90576171875, 5.1063232421875, 5.306884765625, 5.5074462890625, 5.7080078125, 5.9085693359375, 6.109130859375, 6.3096923828125, 6.51025390625, 6.7108154296875, 6.911376953125, 7.1119384765625, 7.3125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 8.0, 13.0, 20.0, 21.0, 31.0, 38.0, 72.0, 113.0, 203.0, 313.0, 485.0, 798.0, 1393.0, 2177.0, 3882.0, 7034.0, 13261.0, 28969.0, 74106.0, 223881.0, 434586.0, 155868.0, 54069.0, 22348.0, 10878.0, 5764.0, 3230.0, 1928.0, 1196.0, 664.0, 444.0, 250.0, 193.0, 109.0, 63.0, 43.0, 32.0, 22.0, 12.0, 11.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.15234375, -4.9930419921875, -4.833740234375, -4.6744384765625, -4.51513671875, -4.3558349609375, -4.196533203125, -4.0372314453125, -3.8779296875, -3.7186279296875, -3.559326171875, -3.4000244140625, -3.24072265625, -3.0814208984375, -2.922119140625, -2.7628173828125, -2.603515625, -2.4442138671875, -2.284912109375, -2.1256103515625, -1.96630859375, -1.8070068359375, -1.647705078125, -1.4884033203125, -1.3291015625, -1.1697998046875, -1.010498046875, -0.8511962890625, -0.69189453125, -0.5325927734375, -0.373291015625, -0.2139892578125, -0.0546875, 0.1046142578125, 0.263916015625, 0.4232177734375, 0.58251953125, 0.7418212890625, 0.901123046875, 1.0604248046875, 1.2197265625, 1.3790283203125, 1.538330078125, 1.6976318359375, 1.85693359375, 2.0162353515625, 2.175537109375, 2.3348388671875, 2.494140625, 2.6534423828125, 2.812744140625, 2.9720458984375, 3.13134765625, 3.2906494140625, 3.449951171875, 3.6092529296875, 3.7685546875, 3.9278564453125, 4.087158203125, 4.2464599609375, 4.40576171875, 4.5650634765625, 4.724365234375, 4.8836669921875, 5.04296875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 15.0, 19.0, 12.0, 14.0, 19.0, 25.0, 30.0, 38.0, 32.0, 41.0, 51.0, 52.0, 73.0, 97.0, 286.0, 1617.0, 145.0, 66.0, 58.0, 58.0, 35.0, 35.0, 28.0, 30.0, 28.0, 21.0, 20.0, 12.0, 10.0, 16.0, 11.0, 4.0, 4.0, 9.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.80908203125, -21.0869140625, -20.36474609375, -19.642578125, -18.92041015625, -18.1982421875, -17.47607421875, -16.75390625, -16.03173828125, -15.3095703125, -14.58740234375, -13.865234375, -13.14306640625, -12.4208984375, -11.69873046875, -10.9765625, -10.25439453125, -9.5322265625, -8.81005859375, -8.087890625, -7.36572265625, -6.6435546875, -5.92138671875, -5.19921875, -4.47705078125, -3.7548828125, -3.03271484375, -2.310546875, -1.58837890625, -0.8662109375, -0.14404296875, 0.578125, 1.30029296875, 2.0224609375, 2.74462890625, 3.466796875, 4.18896484375, 4.9111328125, 5.63330078125, 6.35546875, 7.07763671875, 7.7998046875, 8.52197265625, 9.244140625, 9.96630859375, 10.6884765625, 11.41064453125, 12.1328125, 12.85498046875, 13.5771484375, 14.29931640625, 15.021484375, 15.74365234375, 16.4658203125, 17.18798828125, 17.91015625, 18.63232421875, 19.3544921875, 20.07666015625, 20.798828125, 21.52099609375, 22.2431640625, 22.96533203125, 23.6875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 5.0, 3.0, 7.0, 12.0, 7.0, 12.0, 18.0, 19.0, 23.0, 22.0, 32.0, 39.0, 61.0, 74.0, 120.0, 133.0, 212.0, 301.0, 560.0, 3099.0, 855099.0, 2280285.0, 3778.0, 567.0, 329.0, 222.0, 148.0, 132.0, 91.0, 57.0, 39.0, 35.0, 38.0, 22.0, 29.0, 16.0, 16.0, 7.0, 12.0, 3.0, 3.0, 6.0, 2.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-56.40625, -54.69873046875, -52.9912109375, -51.28369140625, -49.576171875, -47.86865234375, -46.1611328125, -44.45361328125, -42.74609375, -41.03857421875, -39.3310546875, -37.62353515625, -35.916015625, -34.20849609375, -32.5009765625, -30.79345703125, -29.0859375, -27.37841796875, -25.6708984375, -23.96337890625, -22.255859375, -20.54833984375, -18.8408203125, -17.13330078125, -15.42578125, -13.71826171875, -12.0107421875, -10.30322265625, -8.595703125, -6.88818359375, -5.1806640625, -3.47314453125, -1.765625, -0.05810546875, 1.6494140625, 3.35693359375, 5.064453125, 6.77197265625, 8.4794921875, 10.18701171875, 11.89453125, 13.60205078125, 15.3095703125, 17.01708984375, 18.724609375, 20.43212890625, 22.1396484375, 23.84716796875, 25.5546875, 27.26220703125, 28.9697265625, 30.67724609375, 32.384765625, 34.09228515625, 35.7998046875, 37.50732421875, 39.21484375, 40.92236328125, 42.6298828125, 44.33740234375, 46.044921875, 47.75244140625, 49.4599609375, 51.16748046875, 52.875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 153.0, 806.0, 55.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.01434326171875, -22.866750717163086, -17.719158172607422, -12.571565628051758, -7.423973083496094, -2.2763805389404297, 2.8712120056152344, 8.018806457519531, 13.166397094726562, 18.313989639282227, 23.46158218383789, 28.609174728393555, 33.75676727294922, 38.90435791015625, 44.05195236206055, 49.199546813964844, 54.347137451171875, 59.494728088378906, 64.64231872558594, 69.7899169921875, 74.93750762939453, 80.08509826660156, 85.23269653320312, 90.38028717041016, 95.52787780761719, 100.67546844482422, 105.82305908203125, 110.97065734863281, 116.11824798583984, 121.26583862304688, 126.41343688964844, 131.56103515625, 136.7086181640625, 141.85621643066406, 147.00379943847656, 152.15139770507812, 157.29898071289062, 162.4465789794922, 167.59417724609375, 172.74176025390625, 177.8893585205078, 183.03695678710938, 188.18453979492188, 193.33213806152344, 198.479736328125, 203.6273193359375, 208.77491760253906, 213.92251586914062, 219.07009887695312, 224.2176971435547, 229.3652801513672, 234.51287841796875, 239.66046142578125, 244.8080596923828, 249.95565795898438, 255.10324096679688, 260.2508544921875, 265.3984375, 270.5460510253906, 275.6936340332031, 280.8412170410156, 285.98883056640625, 291.13641357421875, 296.28399658203125, 301.43157958984375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 6.0, 12.0, 5.0, 9.0, 12.0, 18.0, 9.0, 18.0, 14.0, 27.0, 23.0, 24.0, 29.0, 29.0, 32.0, 29.0, 42.0, 33.0, 36.0, 42.0, 39.0, 46.0, 41.0, 32.0, 33.0, 42.0, 29.0, 37.0, 28.0, 24.0, 23.0, 22.0, 16.0, 12.0, 12.0, 12.0, 11.0, 12.0, 8.0, 8.0, 9.0, 3.0, 7.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0], "bins": [-43.49616241455078, -42.049827575683594, -40.603492736816406, -39.15715789794922, -37.71082305908203, -36.26448440551758, -34.81814956665039, -33.3718147277832, -31.925479888916016, -30.479145050048828, -29.03281021118164, -27.58647346496582, -26.140138626098633, -24.693803787231445, -23.247467041015625, -21.801132202148438, -20.35479736328125, -18.908462524414062, -17.462127685546875, -16.015790939331055, -14.569456100463867, -13.12312126159668, -11.676785469055176, -10.230449676513672, -8.784114837646484, -7.337779521942139, -5.891444206237793, -4.445108890533447, -2.9987735748291016, -1.5524382591247559, -0.10610294342041016, 1.3402328491210938, 2.7865676879882812, 4.232903003692627, 5.679238319396973, 7.125573635101318, 8.571908950805664, 10.018243789672852, 11.464579582214355, 12.91091537475586, 14.357250213623047, 15.803585052490234, 17.249919891357422, 18.696256637573242, 20.14259147644043, 21.588926315307617, 23.035263061523438, 24.481597900390625, 25.927932739257812, 27.374267578125, 28.820602416992188, 30.266939163208008, 31.713274002075195, 33.159610748291016, 34.6059455871582, 36.05228042602539, 37.49861526489258, 38.944950103759766, 40.39128494262695, 41.83761978149414, 43.283958435058594, 44.73029327392578, 46.17662811279297, 47.622962951660156, 49.069297790527344]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 13.0, 5.0, 10.0, 10.0, 15.0, 18.0, 16.0, 17.0, 29.0, 30.0, 22.0, 30.0, 35.0, 36.0, 32.0, 34.0, 34.0, 38.0, 47.0, 44.0, 45.0, 35.0, 33.0, 29.0, 44.0, 33.0, 28.0, 34.0, 27.0, 26.0, 16.0, 24.0, 17.0, 18.0, 12.0, 11.0, 11.0, 9.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.63201904296875, -5.4281005859375, -5.22418212890625, -5.020263671875, -4.81634521484375, -4.6124267578125, -4.40850830078125, -4.20458984375, -4.00067138671875, -3.7967529296875, -3.59283447265625, -3.388916015625, -3.18499755859375, -2.9810791015625, -2.77716064453125, -2.5732421875, -2.36932373046875, -2.1654052734375, -1.96148681640625, -1.757568359375, -1.55364990234375, -1.3497314453125, -1.14581298828125, -0.94189453125, -0.73797607421875, -0.5340576171875, -0.33013916015625, -0.126220703125, 0.07769775390625, 0.2816162109375, 0.48553466796875, 0.689453125, 0.89337158203125, 1.0972900390625, 1.30120849609375, 1.505126953125, 1.70904541015625, 1.9129638671875, 2.11688232421875, 2.32080078125, 2.52471923828125, 2.7286376953125, 2.93255615234375, 3.136474609375, 3.34039306640625, 3.5443115234375, 3.74822998046875, 3.9521484375, 4.15606689453125, 4.3599853515625, 4.56390380859375, 4.767822265625, 4.97174072265625, 5.1756591796875, 5.37957763671875, 5.58349609375, 5.78741455078125, 5.9913330078125, 6.19525146484375, 6.399169921875, 6.60308837890625, 6.8070068359375, 7.01092529296875, 7.21484375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 0.0, 5.0, 4.0, 10.0, 6.0, 16.0, 11.0, 14.0, 12.0, 12.0, 33.0, 26.0, 32.0, 46.0, 56.0, 93.0, 205.0, 436.0, 1288.0, 4578.0, 27088.0, 519366.0, 3174116.0, 436548.0, 23766.0, 4187.0, 1221.0, 489.0, 215.0, 105.0, 59.0, 52.0, 37.0, 19.0, 28.0, 20.0, 17.0, 14.0, 14.0, 12.0, 7.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.921875, -15.296875, -14.671875, -14.046875, -13.421875, -12.796875, -12.171875, -11.546875, -10.921875, -10.296875, -9.671875, -9.046875, -8.421875, -7.796875, -7.171875, -6.546875, -5.921875, -5.296875, -4.671875, -4.046875, -3.421875, -2.796875, -2.171875, -1.546875, -0.921875, -0.296875, 0.328125, 0.953125, 1.578125, 2.203125, 2.828125, 3.453125, 4.078125, 4.703125, 5.328125, 5.953125, 6.578125, 7.203125, 7.828125, 8.453125, 9.078125, 9.703125, 10.328125, 10.953125, 11.578125, 12.203125, 12.828125, 13.453125, 14.078125, 14.703125, 15.328125, 15.953125, 16.578125, 17.203125, 17.828125, 18.453125, 19.078125, 19.703125, 20.328125, 20.953125, 21.578125, 22.203125, 22.828125, 23.453125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 4.0, 11.0, 12.0, 9.0, 16.0, 13.0, 32.0, 35.0, 32.0, 39.0, 56.0, 86.0, 87.0, 115.0, 152.0, 187.0, 251.0, 333.0, 392.0, 407.0, 387.0, 323.0, 224.0, 202.0, 149.0, 114.0, 97.0, 52.0, 60.0, 35.0, 31.0, 22.0, 20.0, 14.0, 17.0, 10.0, 12.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.921875, -10.594482421875, -10.26708984375, -9.939697265625, -9.6123046875, -9.284912109375, -8.95751953125, -8.630126953125, -8.302734375, -7.975341796875, -7.64794921875, -7.320556640625, -6.9931640625, -6.665771484375, -6.33837890625, -6.010986328125, -5.68359375, -5.356201171875, -5.02880859375, -4.701416015625, -4.3740234375, -4.046630859375, -3.71923828125, -3.391845703125, -3.064453125, -2.737060546875, -2.40966796875, -2.082275390625, -1.7548828125, -1.427490234375, -1.10009765625, -0.772705078125, -0.4453125, -0.117919921875, 0.20947265625, 0.536865234375, 0.8642578125, 1.191650390625, 1.51904296875, 1.846435546875, 2.173828125, 2.501220703125, 2.82861328125, 3.156005859375, 3.4833984375, 3.810791015625, 4.13818359375, 4.465576171875, 4.79296875, 5.120361328125, 5.44775390625, 5.775146484375, 6.1025390625, 6.429931640625, 6.75732421875, 7.084716796875, 7.412109375, 7.739501953125, 8.06689453125, 8.394287109375, 8.7216796875, 9.049072265625, 9.37646484375, 9.703857421875, 10.03125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 9.0, 16.0, 15.0, 15.0, 19.0, 25.0, 31.0, 47.0, 58.0, 65.0, 78.0, 105.0, 125.0, 182.0, 219.0, 305.0, 402.0, 1587.0, 41038.0, 3824102.0, 319366.0, 4392.0, 592.0, 311.0, 219.0, 191.0, 159.0, 107.0, 98.0, 81.0, 65.0, 61.0, 39.0, 36.0, 32.0, 17.0, 21.0, 7.0, 11.0, 9.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.84375, -47.30322265625, -45.7626953125, -44.22216796875, -42.681640625, -41.14111328125, -39.6005859375, -38.06005859375, -36.51953125, -34.97900390625, -33.4384765625, -31.89794921875, -30.357421875, -28.81689453125, -27.2763671875, -25.73583984375, -24.1953125, -22.65478515625, -21.1142578125, -19.57373046875, -18.033203125, -16.49267578125, -14.9521484375, -13.41162109375, -11.87109375, -10.33056640625, -8.7900390625, -7.24951171875, -5.708984375, -4.16845703125, -2.6279296875, -1.08740234375, 0.453125, 1.99365234375, 3.5341796875, 5.07470703125, 6.615234375, 8.15576171875, 9.6962890625, 11.23681640625, 12.77734375, 14.31787109375, 15.8583984375, 17.39892578125, 18.939453125, 20.47998046875, 22.0205078125, 23.56103515625, 25.1015625, 26.64208984375, 28.1826171875, 29.72314453125, 31.263671875, 32.80419921875, 34.3447265625, 35.88525390625, 37.42578125, 38.96630859375, 40.5068359375, 42.04736328125, 43.587890625, 45.12841796875, 46.6689453125, 48.20947265625, 49.75]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 12.0, 43.0, 81.0, 157.0, 204.0, 213.0, 153.0, 89.0, 36.0, 14.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.66555786132812, -93.73625183105469, -90.80694580078125, -87.87764739990234, -84.9483413696289, -82.01903533935547, -79.08973693847656, -76.16043090820312, -73.23112487792969, -70.30181884765625, -67.37251281738281, -64.4432144165039, -61.51390838623047, -58.58460235595703, -55.65530014038086, -52.72599792480469, -49.79669189453125, -46.86738586425781, -43.93808364868164, -41.00878143310547, -38.07947540283203, -35.150169372558594, -32.22086715698242, -29.291563034057617, -26.362258911132812, -23.432954788208008, -20.503650665283203, -17.5743465423584, -14.645042419433594, -11.715738296508789, -8.786434173583984, -5.85713005065918, -2.9278182983398438, 0.0014858245849609375, 2.9307899475097656, 5.86009407043457, 8.789398193359375, 11.71870231628418, 14.648006439208984, 17.57731056213379, 20.506614685058594, 23.4359188079834, 26.365222930908203, 29.294527053833008, 32.22383117675781, 35.15313720703125, 38.08243942260742, 41.011741638183594, 43.94104766845703, 46.87035369873047, 49.79965591430664, 52.72895812988281, 55.65826416015625, 58.58757019042969, 61.51687240600586, 64.44617462158203, 67.37548065185547, 70.3047866821289, 73.23408508300781, 76.16339111328125, 79.09269714355469, 82.02200317382812, 84.95130920410156, 87.88060760498047, 90.8099136352539]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 8.0, 6.0, 11.0, 16.0, 15.0, 20.0, 19.0, 29.0, 26.0, 33.0, 32.0, 35.0, 34.0, 43.0, 30.0, 43.0, 42.0, 30.0, 51.0, 29.0, 55.0, 36.0, 31.0, 34.0, 30.0, 31.0, 32.0, 22.0, 26.0, 19.0, 14.0, 21.0, 18.0, 17.0, 11.0, 12.0, 6.0, 3.0, 6.0, 6.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.440338134765625, -39.168846130371094, -37.8973503112793, -36.625858306884766, -35.35436248779297, -34.08287048339844, -32.811378479003906, -31.539884567260742, -30.268390655517578, -28.996896743774414, -27.72540283203125, -26.45391082763672, -25.182416915893555, -23.91092300415039, -22.63943099975586, -21.367937088012695, -20.09644317626953, -18.824949264526367, -17.553455352783203, -16.281963348388672, -15.010469436645508, -13.738975524902344, -12.467482566833496, -11.195989608764648, -9.924495697021484, -8.65300178527832, -7.381508827209473, -6.110015392303467, -4.838521957397461, -3.567028522491455, -2.295535087585449, -1.0240421295166016, 0.2474517822265625, 1.5189452171325684, 2.790438652038574, 4.06193208694458, 5.333425521850586, 6.604918956756592, 7.876412391662598, 9.147905349731445, 10.41939926147461, 11.690893173217773, 12.962386131286621, 14.233879089355469, 15.505373001098633, 16.776866912841797, 18.048358917236328, 19.319852828979492, 20.591346740722656, 21.86284065246582, 23.134334564208984, 24.405826568603516, 25.67732048034668, 26.948814392089844, 28.220306396484375, 29.49180030822754, 30.763294219970703, 32.034786224365234, 33.30628204345703, 34.57777404785156, 35.849266052246094, 37.12076187133789, 38.39225387573242, 39.66374969482422, 40.93524169921875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 33.0, 23.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 10.0, 22.0, 24.0, 52.0, 81.0, 118.0, 156.0, 279.0, 438.0, 682.0, 953.0, 1517.0, 2365.0, 3675.0, 5810.0, 9203.0, 14509.0, 23276.0, 37834.0, 61601.0, 98723.0, 147986.0, 184909.0, 159820.0, 111352.0, 69369.0, 42787.0, 26219.0, 16148.0, 10262.0, 6518.0, 4285.0, 2613.0, 1772.0, 1082.0, 724.0, 473.0, 305.0, 204.0, 138.0, 87.0, 53.0, 39.0, 21.0, 14.0, 16.0, 10.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.72900390625, -0.7085418701171875, -0.688079833984375, -0.6676177978515625, -0.64715576171875, -0.6266937255859375, -0.606231689453125, -0.5857696533203125, -0.5653076171875, -0.5448455810546875, -0.524383544921875, -0.5039215087890625, -0.48345947265625, -0.4629974365234375, -0.442535400390625, -0.4220733642578125, -0.401611328125, -0.3811492919921875, -0.360687255859375, -0.3402252197265625, -0.31976318359375, -0.2993011474609375, -0.278839111328125, -0.2583770751953125, -0.2379150390625, -0.2174530029296875, -0.196990966796875, -0.1765289306640625, -0.15606689453125, -0.1356048583984375, -0.115142822265625, -0.0946807861328125, -0.07421875, -0.0537567138671875, -0.033294677734375, -0.0128326416015625, 0.00762939453125, 0.0280914306640625, 0.048553466796875, 0.0690155029296875, 0.0894775390625, 0.1099395751953125, 0.130401611328125, 0.1508636474609375, 0.17132568359375, 0.1917877197265625, 0.212249755859375, 0.2327117919921875, 0.253173828125, 0.2736358642578125, 0.294097900390625, 0.3145599365234375, 0.33502197265625, 0.3554840087890625, 0.375946044921875, 0.3964080810546875, 0.4168701171875, 0.4373321533203125, 0.457794189453125, 0.4782562255859375, 0.49871826171875, 0.5191802978515625, 0.539642333984375, 0.5601043701171875, 0.58056640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 4.0, 6.0, 14.0, 15.0, 11.0, 11.0, 17.0, 23.0, 25.0, 26.0, 25.0, 22.0, 21.0, 33.0, 26.0, 39.0, 45.0, 40.0, 35.0, 27.0, 1084.0, 27.0, 33.0, 46.0, 34.0, 27.0, 28.0, 30.0, 19.0, 22.0, 24.0, 25.0, 27.0, 17.0, 15.0, 17.0, 11.0, 14.0, 13.0, 12.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4765625, -3.36114501953125, -3.2457275390625, -3.13031005859375, -3.014892578125, -2.89947509765625, -2.7840576171875, -2.66864013671875, -2.55322265625, -2.43780517578125, -2.3223876953125, -2.20697021484375, -2.091552734375, -1.97613525390625, -1.8607177734375, -1.74530029296875, -1.6298828125, -1.51446533203125, -1.3990478515625, -1.28363037109375, -1.168212890625, -1.05279541015625, -0.9373779296875, -0.82196044921875, -0.70654296875, -0.59112548828125, -0.4757080078125, -0.36029052734375, -0.244873046875, -0.12945556640625, -0.0140380859375, 0.10137939453125, 0.216796875, 0.33221435546875, 0.4476318359375, 0.56304931640625, 0.678466796875, 0.79388427734375, 0.9093017578125, 1.02471923828125, 1.14013671875, 1.25555419921875, 1.3709716796875, 1.48638916015625, 1.601806640625, 1.71722412109375, 1.8326416015625, 1.94805908203125, 2.0634765625, 2.17889404296875, 2.2943115234375, 2.40972900390625, 2.525146484375, 2.64056396484375, 2.7559814453125, 2.87139892578125, 2.98681640625, 3.10223388671875, 3.2176513671875, 3.33306884765625, 3.448486328125, 3.56390380859375, 3.6793212890625, 3.79473876953125, 3.91015625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 11.0, 16.0, 27.0, 31.0, 53.0, 110.0, 177.0, 299.0, 533.0, 946.0, 1620.0, 2911.0, 4782.0, 8338.0, 13508.0, 22538.0, 37024.0, 60519.0, 97000.0, 143703.0, 1224228.0, 164383.0, 118833.0, 76963.0, 47148.0, 28668.0, 17491.0, 10565.0, 6140.0, 3560.0, 2031.0, 1282.0, 699.0, 411.0, 214.0, 161.0, 92.0, 31.0, 32.0, 17.0, 19.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5201873779296875, -0.503265380859375, -0.4863433837890625, -0.46942138671875, -0.4524993896484375, -0.435577392578125, -0.4186553955078125, -0.4017333984375, -0.3848114013671875, -0.367889404296875, -0.3509674072265625, -0.33404541015625, -0.3171234130859375, -0.300201416015625, -0.2832794189453125, -0.266357421875, -0.2494354248046875, -0.232513427734375, -0.2155914306640625, -0.19866943359375, -0.1817474365234375, -0.164825439453125, -0.1479034423828125, -0.1309814453125, -0.1140594482421875, -0.097137451171875, -0.0802154541015625, -0.06329345703125, -0.0463714599609375, -0.029449462890625, -0.0125274658203125, 0.00439453125, 0.0213165283203125, 0.038238525390625, 0.0551605224609375, 0.07208251953125, 0.0890045166015625, 0.105926513671875, 0.1228485107421875, 0.1397705078125, 0.1566925048828125, 0.173614501953125, 0.1905364990234375, 0.20745849609375, 0.2243804931640625, 0.241302490234375, 0.2582244873046875, 0.275146484375, 0.2920684814453125, 0.308990478515625, 0.3259124755859375, 0.34283447265625, 0.3597564697265625, 0.376678466796875, 0.3936004638671875, 0.4105224609375, 0.4274444580078125, 0.444366455078125, 0.4612884521484375, 0.47821044921875, 0.4951324462890625, 0.512054443359375, 0.5289764404296875, 0.5458984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 5.0, 9.0, 7.0, 13.0, 17.0, 21.0, 15.0, 20.0, 25.0, 43.0, 53.0, 67.0, 56.0, 68.0, 75.0, 66.0, 61.0, 62.0, 60.0, 34.0, 28.0, 31.0, 21.0, 24.0, 15.0, 16.0, 16.0, 9.0, 16.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.003993988037109375, -0.0038833022117614746, -0.0037726163864135742, -0.003661930561065674, -0.0035512447357177734, -0.003440558910369873, -0.0033298730850219727, -0.0032191872596740723, -0.003108501434326172, -0.0029978156089782715, -0.002887129783630371, -0.0027764439582824707, -0.0026657581329345703, -0.00255507230758667, -0.0024443864822387695, -0.002333700656890869, -0.0022230148315429688, -0.0021123290061950684, -0.002001643180847168, -0.0018909573554992676, -0.0017802715301513672, -0.0016695857048034668, -0.0015588998794555664, -0.001448214054107666, -0.0013375282287597656, -0.0012268424034118652, -0.0011161565780639648, -0.0010054707527160645, -0.0008947849273681641, -0.0007840991020202637, -0.0006734132766723633, -0.0005627274513244629, -0.0004520416259765625, -0.0003413558006286621, -0.00023066997528076172, -0.00011998414993286133, -9.298324584960938e-06, 0.00010138750076293945, 0.00021207332611083984, 0.00032275915145874023, 0.0004334449768066406, 0.000544130802154541, 0.0006548166275024414, 0.0007655024528503418, 0.0008761882781982422, 0.0009868741035461426, 0.001097559928894043, 0.0012082457542419434, 0.0013189315795898438, 0.0014296174049377441, 0.0015403032302856445, 0.001650989055633545, 0.0017616748809814453, 0.0018723607063293457, 0.001983046531677246, 0.0020937323570251465, 0.002204418182373047, 0.0023151040077209473, 0.0024257898330688477, 0.002536475658416748, 0.0026471614837646484, 0.002757847309112549, 0.0028685331344604492, 0.0029792189598083496, 0.00308990478515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 16.0, 16.0, 14.0, 21.0, 28.0, 46.0, 40.0, 68.0, 80.0, 107.0, 238.0, 1016.0, 47103.0, 990464.0, 8096.0, 524.0, 197.0, 116.0, 96.0, 51.0, 43.0, 24.0, 27.0, 12.0, 17.0, 14.0, 12.0, 6.0, 7.0, 8.0, 9.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06951904296875, -0.0668783187866211, -0.06423759460449219, -0.06159687042236328, -0.058956146240234375, -0.05631542205810547, -0.05367469787597656, -0.051033973693847656, -0.04839324951171875, -0.045752525329589844, -0.04311180114746094, -0.04047107696533203, -0.037830352783203125, -0.03518962860107422, -0.03254890441894531, -0.029908180236816406, -0.0272674560546875, -0.024626731872558594, -0.021986007690429688, -0.01934528350830078, -0.016704559326171875, -0.014063835144042969, -0.011423110961914062, -0.008782386779785156, -0.00614166259765625, -0.0035009384155273438, -0.0008602142333984375, 0.0017805099487304688, 0.004421234130859375, 0.007061958312988281, 0.009702682495117188, 0.012343406677246094, 0.014984130859375, 0.017624855041503906, 0.020265579223632812, 0.02290630340576172, 0.025547027587890625, 0.02818775177001953, 0.030828475952148438, 0.033469200134277344, 0.03610992431640625, 0.038750648498535156, 0.04139137268066406, 0.04403209686279297, 0.046672821044921875, 0.04931354522705078, 0.05195426940917969, 0.054594993591308594, 0.0572357177734375, 0.059876441955566406, 0.06251716613769531, 0.06515789031982422, 0.06779861450195312, 0.07043933868408203, 0.07308006286621094, 0.07572078704833984, 0.07836151123046875, 0.08100223541259766, 0.08364295959472656, 0.08628368377685547, 0.08892440795898438, 0.09156513214111328, 0.09420585632324219, 0.0968465805053711, 0.0994873046875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 38.0, 518.0, 418.0, 34.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002878597006201744, -0.0021503595635294914, -0.0014221223536878824, -0.0006938851438462734, 3.435229882597923e-05, 0.0007625897414982319, 0.0014908267185091972, 0.00221906416118145, 0.0029473016038537025, 0.003675539046525955, 0.004403776489198208, 0.005132013466209173, 0.005860250908881426, 0.0065884883515536785, 0.007316725328564644, 0.008044962771236897, 0.00877320021390915, 0.009501437656581402, 0.010229675099253654, 0.010957911610603333, 0.01168614998459816, 0.012414386495947838, 0.01314262393862009, 0.013870861381292343, 0.014599098823964596, 0.015327336266636848, 0.016055572777986526, 0.016783811151981354, 0.017512047663331032, 0.01824028603732586, 0.018968522548675537, 0.019696760922670364, 0.02042499929666519, 0.02115323580801487, 0.021881474182009697, 0.022609710693359375, 0.023337949067354202, 0.02406618557870388, 0.02479442209005356, 0.025522660464048386, 0.026250898838043213, 0.02697913534939289, 0.027707373723387718, 0.028435610234737396, 0.029163848608732224, 0.0298920851200819, 0.03062032163143158, 0.03134856000542641, 0.032076798379421234, 0.03280503675341606, 0.03353327140212059, 0.03426150977611542, 0.034989748150110245, 0.03571798652410507, 0.0364462211728096, 0.03717445954680443, 0.03790269419550896, 0.038630932569503784, 0.03935916721820831, 0.04008740559220314, 0.04081564396619797, 0.041543882340192795, 0.042272116988897324, 0.04300035536289215, 0.04372859373688698]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 16.0, 15.0, 26.0, 28.0, 33.0, 37.0, 39.0, 56.0, 63.0, 63.0, 62.0, 61.0, 76.0, 70.0, 67.0, 42.0, 45.0, 57.0, 26.0, 19.0, 21.0, 15.0, 17.0, 9.0, 8.0, 8.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00315779447555542, -0.0030496595427393913, -0.0029415246099233627, -0.002833389677107334, -0.0027252547442913055, -0.002617119811475277, -0.0025089848786592484, -0.0024008499458432198, -0.002292715013027191, -0.0021845800802111626, -0.002076445147395134, -0.0019683102145791054, -0.0018601752817630768, -0.0017520403489470482, -0.0016439054161310196, -0.001535770483314991, -0.0014276355504989624, -0.0013195006176829338, -0.0012113656848669052, -0.0011032307520508766, -0.000995095819234848, -0.0008869608864188194, -0.0007788259536027908, -0.0006706910207867622, -0.0005625560879707336, -0.00045442115515470505, -0.00034628622233867645, -0.00023815128952264786, -0.00013001635670661926, -2.1881423890590668e-05, 8.625350892543793e-05, 0.00019438844174146652, 0.0003025233745574951, 0.0004106583073735237, 0.0005187932401895523, 0.0006269281730055809, 0.0007350631058216095, 0.0008431980386376381, 0.0009513329714536667, 0.0010594679042696953, 0.0011676028370857239, 0.0012757377699017525, 0.001383872702717781, 0.0014920076355338097, 0.0016001425683498383, 0.0017082775011658669, 0.0018164124339818954, 0.001924547366797924, 0.0020326822996139526, 0.0021408172324299812, 0.00224895216524601, 0.0023570870980620384, 0.002465222030878067, 0.0025733569636940956, 0.002681491896510124, 0.002789626829326153, 0.0028977617621421814, 0.00300589669495821, 0.0031140316277742386, 0.003222166560590267, 0.0033303014934062958, 0.0034384364262223244, 0.003546571359038353, 0.0036547062918543816, 0.00376284122467041]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 5.0, 12.0, 15.0, 16.0, 18.0, 11.0, 23.0, 32.0, 28.0, 30.0, 21.0, 33.0, 46.0, 41.0, 40.0, 48.0, 38.0, 43.0, 44.0, 50.0, 40.0, 41.0, 41.0, 32.0, 24.0, 26.0, 28.0, 14.0, 23.0, 23.0, 18.0, 19.0, 9.0, 7.0, 9.0, 7.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.71337890625, -5.5048828125, -5.29638671875, -5.087890625, -4.87939453125, -4.6708984375, -4.46240234375, -4.25390625, -4.04541015625, -3.8369140625, -3.62841796875, -3.419921875, -3.21142578125, -3.0029296875, -2.79443359375, -2.5859375, -2.37744140625, -2.1689453125, -1.96044921875, -1.751953125, -1.54345703125, -1.3349609375, -1.12646484375, -0.91796875, -0.70947265625, -0.5009765625, -0.29248046875, -0.083984375, 0.12451171875, 0.3330078125, 0.54150390625, 0.75, 0.95849609375, 1.1669921875, 1.37548828125, 1.583984375, 1.79248046875, 2.0009765625, 2.20947265625, 2.41796875, 2.62646484375, 2.8349609375, 3.04345703125, 3.251953125, 3.46044921875, 3.6689453125, 3.87744140625, 4.0859375, 4.29443359375, 4.5029296875, 4.71142578125, 4.919921875, 5.12841796875, 5.3369140625, 5.54541015625, 5.75390625, 5.96240234375, 6.1708984375, 6.37939453125, 6.587890625, 6.79638671875, 7.0048828125, 7.21337890625, 7.421875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 8.0, 11.0, 7.0, 18.0, 23.0, 34.0, 32.0, 53.0, 57.0, 81.0, 125.0, 171.0, 283.0, 430.0, 882.0, 1753.0, 3752.0, 8442.0, 20365.0, 53640.0, 156912.0, 488872.0, 202755.0, 65841.0, 24978.0, 10138.0, 4431.0, 2025.0, 934.0, 495.0, 320.0, 203.0, 132.0, 81.0, 57.0, 50.0, 40.0, 29.0, 27.0, 17.0, 13.0, 10.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.208251953125, -5.99853515625, -5.788818359375, -5.5791015625, -5.369384765625, -5.15966796875, -4.949951171875, -4.740234375, -4.530517578125, -4.32080078125, -4.111083984375, -3.9013671875, -3.691650390625, -3.48193359375, -3.272216796875, -3.0625, -2.852783203125, -2.64306640625, -2.433349609375, -2.2236328125, -2.013916015625, -1.80419921875, -1.594482421875, -1.384765625, -1.175048828125, -0.96533203125, -0.755615234375, -0.5458984375, -0.336181640625, -0.12646484375, 0.083251953125, 0.29296875, 0.502685546875, 0.71240234375, 0.922119140625, 1.1318359375, 1.341552734375, 1.55126953125, 1.760986328125, 1.970703125, 2.180419921875, 2.39013671875, 2.599853515625, 2.8095703125, 3.019287109375, 3.22900390625, 3.438720703125, 3.6484375, 3.858154296875, 4.06787109375, 4.277587890625, 4.4873046875, 4.697021484375, 4.90673828125, 5.116455078125, 5.326171875, 5.535888671875, 5.74560546875, 5.955322265625, 6.1650390625, 6.374755859375, 6.58447265625, 6.794189453125, 7.00390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 10.0, 10.0, 7.0, 7.0, 6.0, 8.0, 15.0, 16.0, 19.0, 14.0, 33.0, 30.0, 30.0, 31.0, 39.0, 34.0, 56.0, 50.0, 109.0, 384.0, 1582.0, 110.0, 59.0, 55.0, 42.0, 36.0, 42.0, 25.0, 23.0, 24.0, 16.0, 14.0, 13.0, 25.0, 14.0, 13.0, 8.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.22216796875, -17.6162109375, -17.01025390625, -16.404296875, -15.79833984375, -15.1923828125, -14.58642578125, -13.98046875, -13.37451171875, -12.7685546875, -12.16259765625, -11.556640625, -10.95068359375, -10.3447265625, -9.73876953125, -9.1328125, -8.52685546875, -7.9208984375, -7.31494140625, -6.708984375, -6.10302734375, -5.4970703125, -4.89111328125, -4.28515625, -3.67919921875, -3.0732421875, -2.46728515625, -1.861328125, -1.25537109375, -0.6494140625, -0.04345703125, 0.5625, 1.16845703125, 1.7744140625, 2.38037109375, 2.986328125, 3.59228515625, 4.1982421875, 4.80419921875, 5.41015625, 6.01611328125, 6.6220703125, 7.22802734375, 7.833984375, 8.43994140625, 9.0458984375, 9.65185546875, 10.2578125, 10.86376953125, 11.4697265625, 12.07568359375, 12.681640625, 13.28759765625, 13.8935546875, 14.49951171875, 15.10546875, 15.71142578125, 16.3173828125, 16.92333984375, 17.529296875, 18.13525390625, 18.7412109375, 19.34716796875, 19.953125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 8.0, 7.0, 16.0, 11.0, 17.0, 19.0, 26.0, 31.0, 30.0, 35.0, 45.0, 72.0, 90.0, 143.0, 218.0, 326.0, 663.0, 1176.0, 6112.0, 2706212.0, 424309.0, 3461.0, 1071.0, 562.0, 300.0, 182.0, 141.0, 87.0, 68.0, 35.0, 42.0, 42.0, 24.0, 8.0, 23.0, 22.0, 13.0, 10.0, 4.0, 8.0, 8.0, 4.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-45.71875, -44.28564453125, -42.8525390625, -41.41943359375, -39.986328125, -38.55322265625, -37.1201171875, -35.68701171875, -34.25390625, -32.82080078125, -31.3876953125, -29.95458984375, -28.521484375, -27.08837890625, -25.6552734375, -24.22216796875, -22.7890625, -21.35595703125, -19.9228515625, -18.48974609375, -17.056640625, -15.62353515625, -14.1904296875, -12.75732421875, -11.32421875, -9.89111328125, -8.4580078125, -7.02490234375, -5.591796875, -4.15869140625, -2.7255859375, -1.29248046875, 0.140625, 1.57373046875, 3.0068359375, 4.43994140625, 5.873046875, 7.30615234375, 8.7392578125, 10.17236328125, 11.60546875, 13.03857421875, 14.4716796875, 15.90478515625, 17.337890625, 18.77099609375, 20.2041015625, 21.63720703125, 23.0703125, 24.50341796875, 25.9365234375, 27.36962890625, 28.802734375, 30.23583984375, 31.6689453125, 33.10205078125, 34.53515625, 35.96826171875, 37.4013671875, 38.83447265625, 40.267578125, 41.70068359375, 43.1337890625, 44.56689453125, 46.0]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 22.0, 42.0, 62.0, 84.0, 107.0, 155.0, 175.0, 126.0, 85.0, 69.0, 38.0, 20.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.023704528808594, -35.27062225341797, -34.51754379272461, -33.764461517333984, -33.011383056640625, -32.25830078125, -31.505218505859375, -30.752138137817383, -29.99905776977539, -29.2459774017334, -28.492897033691406, -27.73981475830078, -26.98673439025879, -26.233654022216797, -25.480571746826172, -24.72749137878418, -23.974411010742188, -23.221330642700195, -22.468250274658203, -21.715167999267578, -20.962087631225586, -20.209007263183594, -19.45592498779297, -18.702844619750977, -17.949764251708984, -17.196683883666992, -16.443603515625, -15.690521240234375, -14.937440872192383, -14.18436050415039, -13.431279182434082, -12.678197860717773, -11.925118446350098, -11.172037124633789, -10.418956756591797, -9.665876388549805, -8.912795066833496, -8.159713745117188, -7.406633377075195, -6.653552532196045, -5.9004716873168945, -5.147390842437744, -4.394309997558594, -3.6412291526794434, -2.888148307800293, -2.1350674629211426, -1.3819866180419922, -0.6289057731628418, 0.1241750717163086, 0.877255916595459, 1.6303367614746094, 2.3834176063537598, 3.13649845123291, 3.8895792961120605, 4.642660140991211, 5.395740985870361, 6.148821830749512, 6.901902675628662, 7.6549835205078125, 8.408063888549805, 9.161145210266113, 9.914226531982422, 10.667306900024414, 11.420387268066406, 12.173468589782715]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 8.0, 5.0, 15.0, 9.0, 11.0, 18.0, 14.0, 10.0, 11.0, 23.0, 19.0, 19.0, 29.0, 21.0, 24.0, 42.0, 29.0, 32.0, 45.0, 43.0, 33.0, 31.0, 36.0, 34.0, 38.0, 30.0, 40.0, 33.0, 36.0, 26.0, 26.0, 23.0, 17.0, 17.0, 18.0, 20.0, 14.0, 22.0, 15.0, 16.0, 11.0, 6.0, 12.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-46.38966751098633, -44.90962600708008, -43.42958450317383, -41.94954299926758, -40.46950149536133, -38.98945999145508, -37.50941848754883, -36.02937698364258, -34.54933547973633, -33.06929397583008, -31.589252471923828, -30.109210968017578, -28.629169464111328, -27.149127960205078, -25.669086456298828, -24.189044952392578, -22.709001541137695, -21.228960037231445, -19.748918533325195, -18.268877029418945, -16.788835525512695, -15.308794021606445, -13.828751564025879, -12.348710060119629, -10.868668556213379, -9.388627052307129, -7.908585548400879, -6.428543567657471, -4.948502063751221, -3.4684605598449707, -1.9884185791015625, -0.5083770751953125, 0.9716644287109375, 2.4517059326171875, 3.9317476749420166, 5.411789417266846, 6.891830921173096, 8.371871948242188, 9.851914405822754, 11.331955909729004, 12.811997413635254, 14.292038917541504, 15.772080421447754, 17.25212287902832, 18.73216438293457, 20.21220588684082, 21.69224739074707, 23.17228889465332, 24.65233039855957, 26.13237190246582, 27.61241340637207, 29.09245491027832, 30.57249641418457, 32.05253982543945, 33.5325813293457, 35.01262283325195, 36.4926643371582, 37.97270584106445, 39.4527473449707, 40.93278884887695, 42.4128303527832, 43.89287185668945, 45.3729133605957, 46.85295486450195, 48.3329963684082]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 7.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 9.0, 9.0, 20.0, 19.0, 16.0, 28.0, 27.0, 19.0, 35.0, 23.0, 30.0, 40.0, 42.0, 43.0, 65.0, 37.0, 39.0, 47.0, 45.0, 50.0, 34.0, 36.0, 33.0, 29.0, 25.0, 17.0, 21.0, 23.0, 22.0, 13.0, 20.0, 8.0, 8.0, 15.0, 3.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.87109375, -5.6484375, -5.42578125, -5.203125, -4.98046875, -4.7578125, -4.53515625, -4.3125, -4.08984375, -3.8671875, -3.64453125, -3.421875, -3.19921875, -2.9765625, -2.75390625, -2.53125, -2.30859375, -2.0859375, -1.86328125, -1.640625, -1.41796875, -1.1953125, -0.97265625, -0.75, -0.52734375, -0.3046875, -0.08203125, 0.140625, 0.36328125, 0.5859375, 0.80859375, 1.03125, 1.25390625, 1.4765625, 1.69921875, 1.921875, 2.14453125, 2.3671875, 2.58984375, 2.8125, 3.03515625, 3.2578125, 3.48046875, 3.703125, 3.92578125, 4.1484375, 4.37109375, 4.59375, 4.81640625, 5.0390625, 5.26171875, 5.484375, 5.70703125, 5.9296875, 6.15234375, 6.375, 6.59765625, 6.8203125, 7.04296875, 7.265625, 7.48828125, 7.7109375, 7.93359375, 8.15625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 2.0, 13.0, 12.0, 18.0, 12.0, 35.0, 29.0, 43.0, 29.0, 57.0, 95.0, 120.0, 246.0, 557.0, 1970.0, 11276.0, 205060.0, 3335625.0, 613287.0, 20985.0, 3108.0, 824.0, 296.0, 169.0, 97.0, 73.0, 43.0, 30.0, 31.0, 24.0, 26.0, 16.0, 12.0, 13.0, 4.0, 8.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5625, -18.828125, -18.09375, -17.359375, -16.625, -15.890625, -15.15625, -14.421875, -13.6875, -12.953125, -12.21875, -11.484375, -10.75, -10.015625, -9.28125, -8.546875, -7.8125, -7.078125, -6.34375, -5.609375, -4.875, -4.140625, -3.40625, -2.671875, -1.9375, -1.203125, -0.46875, 0.265625, 1.0, 1.734375, 2.46875, 3.203125, 3.9375, 4.671875, 5.40625, 6.140625, 6.875, 7.609375, 8.34375, 9.078125, 9.8125, 10.546875, 11.28125, 12.015625, 12.75, 13.484375, 14.21875, 14.953125, 15.6875, 16.421875, 17.15625, 17.890625, 18.625, 19.359375, 20.09375, 20.828125, 21.5625, 22.296875, 23.03125, 23.765625, 24.5, 25.234375, 25.96875, 26.703125, 27.4375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 8.0, 7.0, 7.0, 7.0, 13.0, 14.0, 16.0, 38.0, 35.0, 55.0, 76.0, 91.0, 140.0, 197.0, 271.0, 377.0, 507.0, 531.0, 475.0, 380.0, 262.0, 146.0, 125.0, 88.0, 46.0, 40.0, 38.0, 30.0, 17.0, 12.0, 13.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7578125, -13.3326416015625, -12.907470703125, -12.4822998046875, -12.05712890625, -11.6319580078125, -11.206787109375, -10.7816162109375, -10.3564453125, -9.9312744140625, -9.506103515625, -9.0809326171875, -8.65576171875, -8.2305908203125, -7.805419921875, -7.3802490234375, -6.955078125, -6.5299072265625, -6.104736328125, -5.6795654296875, -5.25439453125, -4.8292236328125, -4.404052734375, -3.9788818359375, -3.5537109375, -3.1285400390625, -2.703369140625, -2.2781982421875, -1.85302734375, -1.4278564453125, -1.002685546875, -0.5775146484375, -0.15234375, 0.2728271484375, 0.697998046875, 1.1231689453125, 1.54833984375, 1.9735107421875, 2.398681640625, 2.8238525390625, 3.2490234375, 3.6741943359375, 4.099365234375, 4.5245361328125, 4.94970703125, 5.3748779296875, 5.800048828125, 6.2252197265625, 6.650390625, 7.0755615234375, 7.500732421875, 7.9259033203125, 8.35107421875, 8.7762451171875, 9.201416015625, 9.6265869140625, 10.0517578125, 10.4769287109375, 10.902099609375, 11.3272705078125, 11.75244140625, 12.1776123046875, 12.602783203125, 13.0279541015625, 13.453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 13.0, 14.0, 25.0, 32.0, 46.0, 50.0, 74.0, 117.0, 156.0, 257.0, 317.0, 623.0, 5154.0, 3121429.0, 1061055.0, 3227.0, 495.0, 302.0, 248.0, 165.0, 120.0, 114.0, 68.0, 52.0, 38.0, 22.0, 11.0, 10.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.375, -72.0458984375, -69.716796875, -67.3876953125, -65.05859375, -62.7294921875, -60.400390625, -58.0712890625, -55.7421875, -53.4130859375, -51.083984375, -48.7548828125, -46.42578125, -44.0966796875, -41.767578125, -39.4384765625, -37.109375, -34.7802734375, -32.451171875, -30.1220703125, -27.79296875, -25.4638671875, -23.134765625, -20.8056640625, -18.4765625, -16.1474609375, -13.818359375, -11.4892578125, -9.16015625, -6.8310546875, -4.501953125, -2.1728515625, 0.15625, 2.4853515625, 4.814453125, 7.1435546875, 9.47265625, 11.8017578125, 14.130859375, 16.4599609375, 18.7890625, 21.1181640625, 23.447265625, 25.7763671875, 28.10546875, 30.4345703125, 32.763671875, 35.0927734375, 37.421875, 39.7509765625, 42.080078125, 44.4091796875, 46.73828125, 49.0673828125, 51.396484375, 53.7255859375, 56.0546875, 58.3837890625, 60.712890625, 63.0419921875, 65.37109375, 67.7001953125, 70.029296875, 72.3583984375, 74.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 11.0, 30.0, 92.0, 202.0, 281.0, 206.0, 116.0, 45.0, 19.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.51287841796875, -168.0595703125, -164.60626220703125, -161.15296936035156, -157.6996612548828, -154.24635314941406, -150.7930450439453, -147.33973693847656, -143.88644409179688, -140.43313598632812, -136.97982788085938, -133.5265350341797, -130.07322692871094, -126.61991882324219, -123.16661071777344, -119.71331024169922, -116.25999450683594, -112.80668640136719, -109.35338592529297, -105.90007781982422, -102.44677734375, -98.99346923828125, -95.5401611328125, -92.08686065673828, -88.63356018066406, -85.18025207519531, -81.7269515991211, -78.27364349365234, -74.82034301757812, -71.36703491210938, -67.91372680664062, -64.4604263305664, -61.007118225097656, -57.55381393432617, -54.10050964355469, -50.64720153808594, -47.19389724731445, -43.74059295654297, -40.287288665771484, -36.833984375, -33.38067626953125, -29.927371978759766, -26.47406578063965, -23.020761489868164, -19.567455291748047, -16.114151000976562, -12.660846710205078, -9.207540512084961, -5.754238128662109, -2.3009331226348877, 1.152371883392334, 4.605676651000977, 8.058981895446777, 11.512287139892578, 14.965591430664062, 18.41889762878418, 21.872201919555664, 25.32550621032715, 28.778812408447266, 32.23211669921875, 35.685420989990234, 39.13872528076172, 42.59203338623047, 46.04533767700195, 49.49864196777344]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 5.0, 2.0, 11.0, 15.0, 17.0, 13.0, 17.0, 18.0, 19.0, 15.0, 20.0, 24.0, 28.0, 33.0, 31.0, 31.0, 39.0, 45.0, 37.0, 54.0, 38.0, 47.0, 51.0, 36.0, 38.0, 37.0, 24.0, 30.0, 31.0, 19.0, 20.0, 22.0, 13.0, 23.0, 14.0, 18.0, 17.0, 10.0, 10.0, 6.0, 4.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.41998291015625, -37.218482971191406, -36.01698303222656, -34.81548309326172, -33.613983154296875, -32.412479400634766, -31.210979461669922, -30.009479522705078, -28.807979583740234, -27.60647964477539, -26.404979705810547, -25.20347785949707, -24.001977920532227, -22.800477981567383, -21.598976135253906, -20.397476196289062, -19.19597625732422, -17.994476318359375, -16.79297637939453, -15.591474533081055, -14.389974594116211, -13.188474655151367, -11.986973762512207, -10.785472869873047, -9.583972930908203, -8.38247299194336, -7.180972099304199, -5.979471683502197, -4.777971267700195, -3.5764708518981934, -2.3749704360961914, -1.1734695434570312, 0.0280303955078125, 1.2295308113098145, 2.4310312271118164, 3.6325316429138184, 4.83403205871582, 6.035532474517822, 7.237032890319824, 8.438533782958984, 9.640033721923828, 10.841533660888672, 12.043034553527832, 13.244535446166992, 14.446035385131836, 15.64753532409668, 16.849037170410156, 18.050537109375, 19.252037048339844, 20.453536987304688, 21.65503692626953, 22.856538772583008, 24.05803871154785, 25.259538650512695, 26.461040496826172, 27.662540435791016, 28.86404037475586, 30.065540313720703, 31.267040252685547, 32.46854019165039, 33.6700439453125, 34.871543884277344, 36.07304382324219, 37.27454376220703, 38.476043701171875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 48.0, 41.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 16.0, 26.0, 26.0, 52.0, 67.0, 100.0, 174.0, 260.0, 418.0, 710.0, 1189.0, 1977.0, 3160.0, 5145.0, 8273.0, 12600.0, 20089.0, 31966.0, 52147.0, 85864.0, 137606.0, 187584.0, 177016.0, 122884.0, 76292.0, 45968.0, 28269.0, 17873.0, 11415.0, 7367.0, 4664.0, 2928.0, 1660.0, 1098.0, 649.0, 414.0, 232.0, 141.0, 76.0, 53.0, 35.0, 30.0, 16.0, 14.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7509765625, -0.7281341552734375, -0.705291748046875, -0.6824493408203125, -0.65960693359375, -0.6367645263671875, -0.613922119140625, -0.5910797119140625, -0.5682373046875, -0.5453948974609375, -0.522552490234375, -0.4997100830078125, -0.47686767578125, -0.4540252685546875, -0.431182861328125, -0.4083404541015625, -0.385498046875, -0.3626556396484375, -0.339813232421875, -0.3169708251953125, -0.29412841796875, -0.2712860107421875, -0.248443603515625, -0.2256011962890625, -0.2027587890625, -0.1799163818359375, -0.157073974609375, -0.1342315673828125, -0.11138916015625, -0.0885467529296875, -0.065704345703125, -0.0428619384765625, -0.02001953125, 0.0028228759765625, 0.025665283203125, 0.0485076904296875, 0.07135009765625, 0.0941925048828125, 0.117034912109375, 0.1398773193359375, 0.1627197265625, 0.1855621337890625, 0.208404541015625, 0.2312469482421875, 0.25408935546875, 0.2769317626953125, 0.299774169921875, 0.3226165771484375, 0.345458984375, 0.3683013916015625, 0.391143798828125, 0.4139862060546875, 0.43682861328125, 0.4596710205078125, 0.482513427734375, 0.5053558349609375, 0.5281982421875, 0.5510406494140625, 0.573883056640625, 0.5967254638671875, 0.61956787109375, 0.6424102783203125, 0.665252685546875, 0.6880950927734375, 0.7109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 18.0, 12.0, 14.0, 18.0, 17.0, 21.0, 20.0, 23.0, 28.0, 45.0, 35.0, 29.0, 35.0, 34.0, 55.0, 48.0, 1061.0, 39.0, 45.0, 47.0, 38.0, 43.0, 33.0, 31.0, 32.0, 23.0, 21.0, 21.0, 12.0, 17.0, 7.0, 12.0, 12.0, 11.0, 13.0, 4.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.98590087890625, -3.8507080078125, -3.71551513671875, -3.580322265625, -3.44512939453125, -3.3099365234375, -3.17474365234375, -3.03955078125, -2.90435791015625, -2.7691650390625, -2.63397216796875, -2.498779296875, -2.36358642578125, -2.2283935546875, -2.09320068359375, -1.9580078125, -1.82281494140625, -1.6876220703125, -1.55242919921875, -1.417236328125, -1.28204345703125, -1.1468505859375, -1.01165771484375, -0.87646484375, -0.74127197265625, -0.6060791015625, -0.47088623046875, -0.335693359375, -0.20050048828125, -0.0653076171875, 0.06988525390625, 0.205078125, 0.34027099609375, 0.4754638671875, 0.61065673828125, 0.745849609375, 0.88104248046875, 1.0162353515625, 1.15142822265625, 1.28662109375, 1.42181396484375, 1.5570068359375, 1.69219970703125, 1.827392578125, 1.96258544921875, 2.0977783203125, 2.23297119140625, 2.3681640625, 2.50335693359375, 2.6385498046875, 2.77374267578125, 2.908935546875, 3.04412841796875, 3.1793212890625, 3.31451416015625, 3.44970703125, 3.58489990234375, 3.7200927734375, 3.85528564453125, 3.990478515625, 4.12567138671875, 4.2608642578125, 4.39605712890625, 4.53125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 9.0, 18.0, 19.0, 25.0, 66.0, 97.0, 153.0, 249.0, 440.0, 731.0, 1157.0, 1952.0, 3181.0, 5565.0, 9110.0, 15496.0, 25759.0, 43715.0, 71316.0, 112372.0, 159275.0, 1227935.0, 151684.0, 104017.0, 65222.0, 39335.0, 23240.0, 14023.0, 8394.0, 5032.0, 3048.0, 1811.0, 1042.0, 643.0, 376.0, 218.0, 165.0, 83.0, 49.0, 46.0, 23.0, 21.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5597152709960938, -0.5413055419921875, -0.5228958129882812, -0.504486083984375, -0.48607635498046875, -0.4676666259765625, -0.44925689697265625, -0.43084716796875, -0.41243743896484375, -0.3940277099609375, -0.37561798095703125, -0.357208251953125, -0.33879852294921875, -0.3203887939453125, -0.30197906494140625, -0.2835693359375, -0.26515960693359375, -0.2467498779296875, -0.22834014892578125, -0.209930419921875, -0.19152069091796875, -0.1731109619140625, -0.15470123291015625, -0.13629150390625, -0.11788177490234375, -0.0994720458984375, -0.08106231689453125, -0.062652587890625, -0.04424285888671875, -0.0258331298828125, -0.00742340087890625, 0.010986328125, 0.02939605712890625, 0.0478057861328125, 0.06621551513671875, 0.084625244140625, 0.10303497314453125, 0.1214447021484375, 0.13985443115234375, 0.15826416015625, 0.17667388916015625, 0.1950836181640625, 0.21349334716796875, 0.231903076171875, 0.25031280517578125, 0.2687225341796875, 0.28713226318359375, 0.3055419921875, 0.32395172119140625, 0.3423614501953125, 0.36077117919921875, 0.379180908203125, 0.39759063720703125, 0.4160003662109375, 0.43441009521484375, 0.45281982421875, 0.47122955322265625, 0.4896392822265625, 0.5080490112304688, 0.526458740234375, 0.5448684692382812, 0.5632781982421875, 0.5816879272460938, 0.60009765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 8.0, 5.0, 11.0, 10.0, 20.0, 21.0, 22.0, 32.0, 29.0, 38.0, 39.0, 43.0, 45.0, 43.0, 62.0, 68.0, 74.0, 69.0, 50.0, 35.0, 36.0, 39.0, 34.0, 28.0, 27.0, 21.0, 18.0, 15.0, 5.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.003307342529296875, -0.0032024383544921875, -0.0030975341796875, -0.0029926300048828125, -0.002887725830078125, -0.0027828216552734375, -0.00267791748046875, -0.0025730133056640625, -0.002468109130859375, -0.0023632049560546875, -0.00225830078125, -0.0021533966064453125, -0.002048492431640625, -0.0019435882568359375, -0.00183868408203125, -0.0017337799072265625, -0.001628875732421875, -0.0015239715576171875, -0.0014190673828125, -0.0013141632080078125, -0.001209259033203125, -0.0011043548583984375, -0.00099945068359375, -0.0008945465087890625, -0.000789642333984375, -0.0006847381591796875, -0.000579833984375, -0.0004749298095703125, -0.000370025634765625, -0.0002651214599609375, -0.00016021728515625, -5.53131103515625e-05, 4.9591064453125e-05, 0.0001544952392578125, 0.0002593994140625, 0.0003643035888671875, 0.000469207763671875, 0.0005741119384765625, 0.00067901611328125, 0.0007839202880859375, 0.000888824462890625, 0.0009937286376953125, 0.0010986328125, 0.0012035369873046875, 0.001308441162109375, 0.0014133453369140625, 0.00151824951171875, 0.0016231536865234375, 0.001728057861328125, 0.0018329620361328125, 0.0019378662109375, 0.0020427703857421875, 0.002147674560546875, 0.0022525787353515625, 0.00235748291015625, 0.0024623870849609375, 0.002567291259765625, 0.0026721954345703125, 0.002777099609375, 0.0028820037841796875, 0.002986907958984375, 0.0030918121337890625, 0.00319671630859375, 0.0033016204833984375, 0.003406524658203125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 10.0, 8.0, 8.0, 12.0, 14.0, 27.0, 29.0, 28.0, 44.0, 56.0, 83.0, 100.0, 139.0, 265.0, 619.0, 9037.0, 936400.0, 99086.0, 1547.0, 355.0, 190.0, 128.0, 71.0, 72.0, 48.0, 37.0, 33.0, 22.0, 19.0, 14.0, 9.0, 7.0, 10.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0784912109375, -0.07609367370605469, -0.07369613647460938, -0.07129859924316406, -0.06890106201171875, -0.06650352478027344, -0.06410598754882812, -0.06170845031738281, -0.0593109130859375, -0.05691337585449219, -0.054515838623046875, -0.05211830139160156, -0.04972076416015625, -0.04732322692871094, -0.044925689697265625, -0.04252815246582031, -0.040130615234375, -0.03773307800292969, -0.035335540771484375, -0.03293800354003906, -0.03054046630859375, -0.028142929077148438, -0.025745391845703125, -0.023347854614257812, -0.0209503173828125, -0.018552780151367188, -0.016155242919921875, -0.013757705688476562, -0.01136016845703125, -0.008962631225585938, -0.006565093994140625, -0.0041675567626953125, -0.00177001953125, 0.0006275177001953125, 0.003025054931640625, 0.0054225921630859375, 0.00782012939453125, 0.010217666625976562, 0.012615203857421875, 0.015012741088867188, 0.0174102783203125, 0.019807815551757812, 0.022205352783203125, 0.024602890014648438, 0.02700042724609375, 0.029397964477539062, 0.031795501708984375, 0.03419303894042969, 0.036590576171875, 0.03898811340332031, 0.041385650634765625, 0.04378318786621094, 0.04618072509765625, 0.04857826232910156, 0.050975799560546875, 0.05337333679199219, 0.0557708740234375, 0.05816841125488281, 0.060565948486328125, 0.06296348571777344, 0.06536102294921875, 0.06775856018066406, 0.07015609741210938, 0.07255363464355469, 0.074951171875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 20.0, 140.0, 533.0, 246.0, 58.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028252651914954185, -0.027736257761716843, -0.0272198636084795, -0.026703469455242157, -0.026187075302004814, -0.02567068114876747, -0.02515428699553013, -0.024637892842292786, -0.024121496826410294, -0.02360510267317295, -0.023088708519935608, -0.022572314366698265, -0.022055920213460922, -0.02153952606022358, -0.021023131906986237, -0.020506735891103745, -0.01999034360051155, -0.019473949447274208, -0.018957555294036865, -0.018441161140799522, -0.01792476698756218, -0.017408372834324837, -0.016891978681087494, -0.016375582665205002, -0.015859190374612808, -0.015342796221375465, -0.014826402068138123, -0.01431000791490078, -0.013793613761663437, -0.013277219608426094, -0.012760824523866177, -0.012244430370628834, -0.011728035286068916, -0.011211641132831573, -0.01069524697959423, -0.010178852826356888, -0.009662458673119545, -0.009146064519882202, -0.008629669435322285, -0.008113275282084942, -0.007596881128847599, -0.007080486975610256, -0.006564092822372913, -0.006047698203474283, -0.00553130405023694, -0.0050149098969995975, -0.004498515278100967, -0.003982121124863625, -0.0034657269716262817, -0.002949332818388939, -0.0024329384323209524, -0.0019165441626682878, -0.001400149893015623, -0.0008837557397782803, -0.00036736135371029377, 0.00014903303235769272, 0.0006654271855950356, 0.0011818214552477002, 0.0016982157249003649, 0.0022146101109683514, 0.002731004264205694, 0.003247398417443037, 0.0037637928035110235, 0.00428018718957901, 0.004796581342816353]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 11.0, 14.0, 15.0, 27.0, 20.0, 35.0, 23.0, 26.0, 35.0, 37.0, 31.0, 44.0, 50.0, 36.0, 40.0, 49.0, 46.0, 51.0, 52.0, 38.0, 45.0, 30.0, 22.0, 34.0, 41.0, 17.0, 22.0, 20.0, 21.0, 11.0, 11.0, 9.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024050474166870117, -0.002334785647690296, -0.0022645238786935806, -0.002194262109696865, -0.0021240003407001495, -0.002053738571703434, -0.0019834768027067184, -0.001913215033710003, -0.0018429532647132874, -0.0017726914957165718, -0.0017024297267198563, -0.0016321679577231407, -0.0015619061887264252, -0.0014916444197297096, -0.001421382650732994, -0.0013511208817362785, -0.001280859112739563, -0.0012105973437428474, -0.001140335574746132, -0.0010700738057494164, -0.0009998120367527008, -0.0009295502677559853, -0.0008592884987592697, -0.0007890267297625542, -0.0007187649607658386, -0.0006485031917691231, -0.0005782414227724075, -0.000507979653775692, -0.00043771788477897644, -0.0003674561157822609, -0.00029719434678554535, -0.0002269325777888298, -0.00015667080879211426, -8.640903979539871e-05, -1.6147270798683167e-05, 5.411449819803238e-05, 0.00012437626719474792, 0.00019463803619146347, 0.000264899805188179, 0.00033516157418489456, 0.0004054233431816101, 0.00047568511217832565, 0.0005459468811750412, 0.0006162086501717567, 0.0006864704191684723, 0.0007567321881651878, 0.0008269939571619034, 0.0008972557261586189, 0.0009675174951553345, 0.00103777926415205, 0.0011080410331487656, 0.0011783028021454811, 0.0012485645711421967, 0.0013188263401389122, 0.0013890881091356277, 0.0014593498781323433, 0.0015296116471290588, 0.0015998734161257744, 0.00167013518512249, 0.0017403969541192055, 0.001810658723115921, 0.0018809204921126366, 0.0019511822611093521, 0.0020214440301060677, 0.002091705799102783]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 5.0, 9.0, 7.0, 12.0, 10.0, 13.0, 15.0, 21.0, 27.0, 29.0, 22.0, 36.0, 27.0, 34.0, 42.0, 47.0, 42.0, 41.0, 50.0, 30.0, 44.0, 40.0, 41.0, 42.0, 30.0, 36.0, 31.0, 26.0, 23.0, 21.0, 20.0, 19.0, 10.0, 17.0, 9.0, 11.0, 7.0, 10.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.125, -5.9140625, -5.703125, -5.4921875, -5.28125, -5.0703125, -4.859375, -4.6484375, -4.4375, -4.2265625, -4.015625, -3.8046875, -3.59375, -3.3828125, -3.171875, -2.9609375, -2.75, -2.5390625, -2.328125, -2.1171875, -1.90625, -1.6953125, -1.484375, -1.2734375, -1.0625, -0.8515625, -0.640625, -0.4296875, -0.21875, -0.0078125, 0.203125, 0.4140625, 0.625, 0.8359375, 1.046875, 1.2578125, 1.46875, 1.6796875, 1.890625, 2.1015625, 2.3125, 2.5234375, 2.734375, 2.9453125, 3.15625, 3.3671875, 3.578125, 3.7890625, 4.0, 4.2109375, 4.421875, 4.6328125, 4.84375, 5.0546875, 5.265625, 5.4765625, 5.6875, 5.8984375, 6.109375, 6.3203125, 6.53125, 6.7421875, 6.953125, 7.1640625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 11.0, 11.0, 10.0, 15.0, 15.0, 11.0, 37.0, 30.0, 41.0, 60.0, 75.0, 114.0, 130.0, 232.0, 344.0, 633.0, 1336.0, 3459.0, 13149.0, 74670.0, 747616.0, 174254.0, 22854.0, 5562.0, 1778.0, 786.0, 421.0, 260.0, 168.0, 114.0, 69.0, 61.0, 51.0, 40.0, 27.0, 24.0, 12.0, 14.0, 18.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3828125, -10.999267578125, -10.61572265625, -10.232177734375, -9.8486328125, -9.465087890625, -9.08154296875, -8.697998046875, -8.314453125, -7.930908203125, -7.54736328125, -7.163818359375, -6.7802734375, -6.396728515625, -6.01318359375, -5.629638671875, -5.24609375, -4.862548828125, -4.47900390625, -4.095458984375, -3.7119140625, -3.328369140625, -2.94482421875, -2.561279296875, -2.177734375, -1.794189453125, -1.41064453125, -1.027099609375, -0.6435546875, -0.260009765625, 0.12353515625, 0.507080078125, 0.890625, 1.274169921875, 1.65771484375, 2.041259765625, 2.4248046875, 2.808349609375, 3.19189453125, 3.575439453125, 3.958984375, 4.342529296875, 4.72607421875, 5.109619140625, 5.4931640625, 5.876708984375, 6.26025390625, 6.643798828125, 7.02734375, 7.410888671875, 7.79443359375, 8.177978515625, 8.5615234375, 8.945068359375, 9.32861328125, 9.712158203125, 10.095703125, 10.479248046875, 10.86279296875, 11.246337890625, 11.6298828125, 12.013427734375, 12.39697265625, 12.780517578125, 13.1640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 8.0, 3.0, 7.0, 8.0, 11.0, 8.0, 8.0, 20.0, 20.0, 25.0, 33.0, 33.0, 24.0, 22.0, 35.0, 41.0, 44.0, 63.0, 155.0, 1776.0, 204.0, 59.0, 45.0, 52.0, 49.0, 47.0, 35.0, 38.0, 29.0, 29.0, 12.0, 26.0, 19.0, 11.0, 10.0, 11.0, 8.0, 3.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.457275390625, -17.78955078125, -17.121826171875, -16.4541015625, -15.786376953125, -15.11865234375, -14.450927734375, -13.783203125, -13.115478515625, -12.44775390625, -11.780029296875, -11.1123046875, -10.444580078125, -9.77685546875, -9.109130859375, -8.44140625, -7.773681640625, -7.10595703125, -6.438232421875, -5.7705078125, -5.102783203125, -4.43505859375, -3.767333984375, -3.099609375, -2.431884765625, -1.76416015625, -1.096435546875, -0.4287109375, 0.239013671875, 0.90673828125, 1.574462890625, 2.2421875, 2.909912109375, 3.57763671875, 4.245361328125, 4.9130859375, 5.580810546875, 6.24853515625, 6.916259765625, 7.583984375, 8.251708984375, 8.91943359375, 9.587158203125, 10.2548828125, 10.922607421875, 11.59033203125, 12.258056640625, 12.92578125, 13.593505859375, 14.26123046875, 14.928955078125, 15.5966796875, 16.264404296875, 16.93212890625, 17.599853515625, 18.267578125, 18.935302734375, 19.60302734375, 20.270751953125, 20.9384765625, 21.606201171875, 22.27392578125, 22.941650390625, 23.609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 12.0, 11.0, 27.0, 24.0, 30.0, 44.0, 48.0, 67.0, 65.0, 115.0, 177.0, 313.0, 801.0, 14052.0, 3121063.0, 7328.0, 636.0, 304.0, 141.0, 87.0, 59.0, 47.0, 43.0, 33.0, 31.0, 24.0, 18.0, 7.0, 15.0, 10.0, 7.0, 6.0, 7.0, 7.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-71.125, -69.0595703125, -66.994140625, -64.9287109375, -62.86328125, -60.7978515625, -58.732421875, -56.6669921875, -54.6015625, -52.5361328125, -50.470703125, -48.4052734375, -46.33984375, -44.2744140625, -42.208984375, -40.1435546875, -38.078125, -36.0126953125, -33.947265625, -31.8818359375, -29.81640625, -27.7509765625, -25.685546875, -23.6201171875, -21.5546875, -19.4892578125, -17.423828125, -15.3583984375, -13.29296875, -11.2275390625, -9.162109375, -7.0966796875, -5.03125, -2.9658203125, -0.900390625, 1.1650390625, 3.23046875, 5.2958984375, 7.361328125, 9.4267578125, 11.4921875, 13.5576171875, 15.623046875, 17.6884765625, 19.75390625, 21.8193359375, 23.884765625, 25.9501953125, 28.015625, 30.0810546875, 32.146484375, 34.2119140625, 36.27734375, 38.3427734375, 40.408203125, 42.4736328125, 44.5390625, 46.6044921875, 48.669921875, 50.7353515625, 52.80078125, 54.8662109375, 56.931640625, 58.9970703125, 61.0625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 110.0, 746.0, 157.0, 5.0], "bins": [-245.0657196044922, -241.08157348632812, -237.09744262695312, -233.11329650878906, -229.129150390625, -225.14500427246094, -221.16085815429688, -217.17672729492188, -213.1925811767578, -209.20843505859375, -205.22430419921875, -201.2401580810547, -197.25601196289062, -193.27186584472656, -189.2877197265625, -185.3035888671875, -181.31944274902344, -177.33529663085938, -173.35116577148438, -169.3670196533203, -165.38287353515625, -161.3987274169922, -157.41458129882812, -153.43045043945312, -149.44630432128906, -145.462158203125, -141.47802734375, -137.49388122558594, -133.50973510742188, -129.5255889892578, -125.54145050048828, -121.55731201171875, -117.57316589355469, -113.58901977539062, -109.6048812866211, -105.62074279785156, -101.6365966796875, -97.65245056152344, -93.6683120727539, -89.68417358398438, -85.70002746582031, -81.71588134765625, -77.73174285888672, -73.74760437011719, -69.76345825195312, -65.77931213378906, -61.79517364501953, -57.811031341552734, -53.82688522338867, -49.842742919921875, -45.85860061645508, -41.87445831298828, -37.890316009521484, -33.90617370605469, -29.92203140258789, -25.937889099121094, -21.953746795654297, -17.9696044921875, -13.985462188720703, -10.001319885253906, -6.017177581787109, -2.0330352783203125, 1.9511070251464844, 5.935249328613281, 9.919390678405762]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 8.0, 11.0, 7.0, 6.0, 12.0, 17.0, 16.0, 16.0, 19.0, 17.0, 30.0, 28.0, 18.0, 40.0, 34.0, 32.0, 33.0, 36.0, 35.0, 39.0, 41.0, 40.0, 33.0, 45.0, 40.0, 31.0, 38.0, 27.0, 21.0, 32.0, 27.0, 17.0, 20.0, 19.0, 16.0, 19.0, 10.0, 12.0, 11.0, 8.0, 7.0, 3.0, 7.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-62.56318664550781, -60.72850036621094, -58.89381408691406, -57.05912780761719, -55.22444152832031, -53.38975524902344, -51.55506896972656, -49.72038269042969, -47.88569641113281, -46.05101013183594, -44.21632385253906, -42.38163757324219, -40.54695129394531, -38.71226501464844, -36.87757873535156, -35.04289245605469, -33.20820236206055, -31.373516082763672, -29.538829803466797, -27.704143524169922, -25.869457244873047, -24.034770965576172, -22.200082778930664, -20.36539649963379, -18.530710220336914, -16.69602394104004, -14.861337661743164, -13.026650428771973, -11.191964149475098, -9.357277870178223, -7.522590637207031, -5.687904357910156, -3.8532180786132812, -2.018531560897827, -0.18384504318237305, 1.6508417129516602, 3.485527992248535, 5.32021427154541, 7.154901504516602, 8.989587783813477, 10.824274063110352, 12.658960342407227, 14.493646621704102, 16.32833480834961, 18.163021087646484, 19.99770736694336, 21.832393646240234, 23.66707992553711, 25.501766204833984, 27.33645248413086, 29.171138763427734, 31.00582504272461, 32.840511322021484, 34.67519760131836, 36.5098876953125, 38.344573974609375, 40.17926025390625, 42.013946533203125, 43.8486328125, 45.683319091796875, 47.51800537109375, 49.352691650390625, 51.1873779296875, 53.022064208984375, 54.85675048828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 2.0, 11.0, 6.0, 10.0, 13.0, 7.0, 22.0, 22.0, 21.0, 26.0, 24.0, 32.0, 36.0, 30.0, 48.0, 42.0, 48.0, 41.0, 50.0, 36.0, 44.0, 37.0, 48.0, 42.0, 36.0, 38.0, 30.0, 23.0, 24.0, 21.0, 19.0, 16.0, 20.0, 5.0, 6.0, 14.0, 10.0, 9.0, 6.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.98614501953125, -6.7535400390625, -6.52093505859375, -6.288330078125, -6.05572509765625, -5.8231201171875, -5.59051513671875, -5.35791015625, -5.12530517578125, -4.8927001953125, -4.66009521484375, -4.427490234375, -4.19488525390625, -3.9622802734375, -3.72967529296875, -3.4970703125, -3.26446533203125, -3.0318603515625, -2.79925537109375, -2.566650390625, -2.33404541015625, -2.1014404296875, -1.86883544921875, -1.63623046875, -1.40362548828125, -1.1710205078125, -0.93841552734375, -0.705810546875, -0.47320556640625, -0.2406005859375, -0.00799560546875, 0.224609375, 0.45721435546875, 0.6898193359375, 0.92242431640625, 1.155029296875, 1.38763427734375, 1.6202392578125, 1.85284423828125, 2.08544921875, 2.31805419921875, 2.5506591796875, 2.78326416015625, 3.015869140625, 3.24847412109375, 3.4810791015625, 3.71368408203125, 3.9462890625, 4.17889404296875, 4.4114990234375, 4.64410400390625, 4.876708984375, 5.10931396484375, 5.3419189453125, 5.57452392578125, 5.80712890625, 6.03973388671875, 6.2723388671875, 6.50494384765625, 6.737548828125, 6.97015380859375, 7.2027587890625, 7.43536376953125, 7.66796875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 4.0, 11.0, 10.0, 17.0, 23.0, 38.0, 34.0, 56.0, 79.0, 136.0, 203.0, 287.0, 466.0, 763.0, 1361.0, 2472.0, 4900.0, 10476.0, 26248.0, 86239.0, 331269.0, 1018546.0, 1557390.0, 808837.0, 239734.0, 64975.0, 21212.0, 8755.0, 4182.0, 2266.0, 1186.0, 713.0, 471.0, 277.0, 172.0, 119.0, 103.0, 65.0, 45.0, 36.0, 26.0, 19.0, 13.0, 13.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.328125, -8.062744140625, -7.79736328125, -7.531982421875, -7.2666015625, -7.001220703125, -6.73583984375, -6.470458984375, -6.205078125, -5.939697265625, -5.67431640625, -5.408935546875, -5.1435546875, -4.878173828125, -4.61279296875, -4.347412109375, -4.08203125, -3.816650390625, -3.55126953125, -3.285888671875, -3.0205078125, -2.755126953125, -2.48974609375, -2.224365234375, -1.958984375, -1.693603515625, -1.42822265625, -1.162841796875, -0.8974609375, -0.632080078125, -0.36669921875, -0.101318359375, 0.1640625, 0.429443359375, 0.69482421875, 0.960205078125, 1.2255859375, 1.490966796875, 1.75634765625, 2.021728515625, 2.287109375, 2.552490234375, 2.81787109375, 3.083251953125, 3.3486328125, 3.614013671875, 3.87939453125, 4.144775390625, 4.41015625, 4.675537109375, 4.94091796875, 5.206298828125, 5.4716796875, 5.737060546875, 6.00244140625, 6.267822265625, 6.533203125, 6.798583984375, 7.06396484375, 7.329345703125, 7.5947265625, 7.860107421875, 8.12548828125, 8.390869140625, 8.65625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 12.0, 5.0, 22.0, 36.0, 50.0, 100.0, 113.0, 179.0, 268.0, 408.0, 621.0, 687.0, 532.0, 366.0, 258.0, 144.0, 97.0, 60.0, 52.0, 23.0, 19.0, 8.0, 6.0, 8.0, 7.0, 1.0, 1.0], "bins": [-29.265625, -28.6602783203125, -28.054931640625, -27.4495849609375, -26.84423828125, -26.2388916015625, -25.633544921875, -25.0281982421875, -24.4228515625, -23.8175048828125, -23.212158203125, -22.6068115234375, -22.00146484375, -21.3961181640625, -20.790771484375, -20.1854248046875, -19.580078125, -18.9747314453125, -18.369384765625, -17.7640380859375, -17.15869140625, -16.5533447265625, -15.947998046875, -15.3426513671875, -14.7373046875, -14.1319580078125, -13.526611328125, -12.9212646484375, -12.31591796875, -11.7105712890625, -11.105224609375, -10.4998779296875, -9.89453125, -9.2891845703125, -8.683837890625, -8.0784912109375, -7.47314453125, -6.8677978515625, -6.262451171875, -5.6571044921875, -5.0517578125, -4.4464111328125, -3.841064453125, -3.2357177734375, -2.63037109375, -2.0250244140625, -1.419677734375, -0.8143310546875, -0.208984375, 0.3963623046875, 1.001708984375, 1.6070556640625, 2.21240234375, 2.8177490234375, 3.423095703125, 4.0284423828125, 4.6337890625, 5.2391357421875, 5.844482421875, 6.4498291015625, 7.05517578125, 7.6605224609375, 8.265869140625, 8.8712158203125, 9.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 15.0, 17.0, 32.0, 65.0, 103.0, 158.0, 282.0, 440.0, 1007.0, 7899.0, 4055565.0, 125536.0, 1680.0, 608.0, 357.0, 223.0, 125.0, 72.0, 44.0, 29.0, 16.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.9375, -60.2841796875, -57.630859375, -54.9775390625, -52.32421875, -49.6708984375, -47.017578125, -44.3642578125, -41.7109375, -39.0576171875, -36.404296875, -33.7509765625, -31.09765625, -28.4443359375, -25.791015625, -23.1376953125, -20.484375, -17.8310546875, -15.177734375, -12.5244140625, -9.87109375, -7.2177734375, -4.564453125, -1.9111328125, 0.7421875, 3.3955078125, 6.048828125, 8.7021484375, 11.35546875, 14.0087890625, 16.662109375, 19.3154296875, 21.96875, 24.6220703125, 27.275390625, 29.9287109375, 32.58203125, 35.2353515625, 37.888671875, 40.5419921875, 43.1953125, 45.8486328125, 48.501953125, 51.1552734375, 53.80859375, 56.4619140625, 59.115234375, 61.7685546875, 64.421875, 67.0751953125, 69.728515625, 72.3818359375, 75.03515625, 77.6884765625, 80.341796875, 82.9951171875, 85.6484375, 88.3017578125, 90.955078125, 93.6083984375, 96.26171875, 98.9150390625, 101.568359375, 104.2216796875, 106.875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 342.0, 676.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1392.4459228515625, -1367.169921875, -1341.89404296875, -1316.6180419921875, -1291.3421630859375, -1266.066162109375, -1240.790283203125, -1215.5142822265625, -1190.2384033203125, -1164.96240234375, -1139.6865234375, -1114.4105224609375, -1089.1346435546875, -1063.858642578125, -1038.582763671875, -1013.3067626953125, -988.0308227539062, -962.7548828125, -937.4789428710938, -912.2030029296875, -886.9270629882812, -861.651123046875, -836.3751220703125, -811.0992431640625, -785.8232421875, -760.5473022460938, -735.2713623046875, -709.9954223632812, -684.719482421875, -659.4435424804688, -634.1676025390625, -608.8916015625, -583.61572265625, -558.3397827148438, -533.0638427734375, -507.78790283203125, -482.511962890625, -457.23602294921875, -431.9600524902344, -406.6841125488281, -381.408203125, -356.13226318359375, -330.8563232421875, -305.58038330078125, -280.304443359375, -255.0284881591797, -229.75253295898438, -204.47659301757812, -179.2006378173828, -153.92469787597656, -128.64874267578125, -103.372802734375, -78.09686279296875, -52.8209228515625, -27.544967651367188, -2.2690277099609375, 23.006912231445312, 48.28285598754883, 73.55879974365234, 98.83474731445312, 124.11068725585938, 149.38662719726562, 174.66258239746094, 199.9385223388672, 225.21446228027344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 9.0, 15.0, 18.0, 12.0, 26.0, 31.0, 27.0, 43.0, 48.0, 51.0, 50.0, 58.0, 58.0, 62.0, 62.0, 47.0, 55.0, 50.0, 56.0, 45.0, 33.0, 40.0, 26.0, 20.0, 23.0, 14.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.742645263671875, -43.7707633972168, -41.79888153076172, -39.82699966430664, -37.85511779785156, -35.88323974609375, -33.91135787963867, -31.939476013183594, -29.967594146728516, -27.995712280273438, -26.02383041381836, -24.051950454711914, -22.080068588256836, -20.108186721801758, -18.136306762695312, -16.164424896240234, -14.192543029785156, -12.220661163330078, -10.248780250549316, -8.276899337768555, -6.305017471313477, -4.333135604858398, -2.3612546920776367, -0.389373779296875, 1.5825080871582031, 3.554389476776123, 5.526270866394043, 7.498152256011963, 9.470033645629883, 11.441915512084961, 13.413796424865723, 15.385677337646484, 17.357559204101562, 19.32944107055664, 21.30132293701172, 23.273202896118164, 25.245084762573242, 27.21696662902832, 29.188846588134766, 31.160728454589844, 33.13261032104492, 35.1044921875, 37.07637405395508, 39.048255920410156, 41.02013397216797, 42.99201965332031, 44.963897705078125, 46.9357795715332, 48.90766143798828, 50.87954330444336, 52.85142517089844, 54.823307037353516, 56.795188903808594, 58.767066955566406, 60.738948822021484, 62.71083068847656, 64.68270874023438, 66.65458679199219, 68.62647247314453, 70.59835052490234, 72.57023620605469, 74.5421142578125, 76.51399993896484, 78.48587799072266, 80.457763671875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 40.0, 46.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 21.0, 39.0, 51.0, 69.0, 94.0, 170.0, 248.0, 358.0, 501.0, 679.0, 1040.0, 1590.0, 2242.0, 3376.0, 4780.0, 7045.0, 10458.0, 15408.0, 22632.0, 34583.0, 51116.0, 77387.0, 110941.0, 147149.0, 157669.0, 126405.0, 89143.0, 60510.0, 39794.0, 26825.0, 18041.0, 12245.0, 8298.0, 5520.0, 3900.0, 2583.0, 1810.0, 1204.0, 821.0, 591.0, 381.0, 282.0, 180.0, 128.0, 81.0, 52.0, 41.0, 22.0, 18.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.6103515625, -0.5919647216796875, -0.573577880859375, -0.5551910400390625, -0.53680419921875, -0.5184173583984375, -0.500030517578125, -0.4816436767578125, -0.4632568359375, -0.4448699951171875, -0.426483154296875, -0.4080963134765625, -0.38970947265625, -0.3713226318359375, -0.352935791015625, -0.3345489501953125, -0.316162109375, -0.2977752685546875, -0.279388427734375, -0.2610015869140625, -0.24261474609375, -0.2242279052734375, -0.205841064453125, -0.1874542236328125, -0.1690673828125, -0.1506805419921875, -0.132293701171875, -0.1139068603515625, -0.09552001953125, -0.0771331787109375, -0.058746337890625, -0.0403594970703125, -0.02197265625, -0.0035858154296875, 0.014801025390625, 0.0331878662109375, 0.05157470703125, 0.0699615478515625, 0.088348388671875, 0.1067352294921875, 0.1251220703125, 0.1435089111328125, 0.161895751953125, 0.1802825927734375, 0.19866943359375, 0.2170562744140625, 0.235443115234375, 0.2538299560546875, 0.272216796875, 0.2906036376953125, 0.308990478515625, 0.3273773193359375, 0.34576416015625, 0.3641510009765625, 0.382537841796875, 0.4009246826171875, 0.4193115234375, 0.4376983642578125, 0.456085205078125, 0.4744720458984375, 0.49285888671875, 0.5112457275390625, 0.529632568359375, 0.5480194091796875, 0.56640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 4.0, 5.0, 15.0, 14.0, 18.0, 23.0, 27.0, 15.0, 24.0, 31.0, 38.0, 32.0, 30.0, 48.0, 36.0, 44.0, 42.0, 1065.0, 38.0, 44.0, 39.0, 32.0, 35.0, 29.0, 37.0, 23.0, 25.0, 21.0, 35.0, 23.0, 21.0, 15.0, 12.0, 12.0, 8.0, 7.0, 6.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.4183349609375, -4.281982421875, -4.1456298828125, -4.00927734375, -3.8729248046875, -3.736572265625, -3.6002197265625, -3.4638671875, -3.3275146484375, -3.191162109375, -3.0548095703125, -2.91845703125, -2.7821044921875, -2.645751953125, -2.5093994140625, -2.373046875, -2.2366943359375, -2.100341796875, -1.9639892578125, -1.82763671875, -1.6912841796875, -1.554931640625, -1.4185791015625, -1.2822265625, -1.1458740234375, -1.009521484375, -0.8731689453125, -0.73681640625, -0.6004638671875, -0.464111328125, -0.3277587890625, -0.19140625, -0.0550537109375, 0.081298828125, 0.2176513671875, 0.35400390625, 0.4903564453125, 0.626708984375, 0.7630615234375, 0.8994140625, 1.0357666015625, 1.172119140625, 1.3084716796875, 1.44482421875, 1.5811767578125, 1.717529296875, 1.8538818359375, 1.990234375, 2.1265869140625, 2.262939453125, 2.3992919921875, 2.53564453125, 2.6719970703125, 2.808349609375, 2.9447021484375, 3.0810546875, 3.2174072265625, 3.353759765625, 3.4901123046875, 3.62646484375, 3.7628173828125, 3.899169921875, 4.0355224609375, 4.171875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 18.0, 24.0, 35.0, 52.0, 72.0, 128.0, 202.0, 290.0, 498.0, 827.0, 1311.0, 1945.0, 3292.0, 5429.0, 8747.0, 13987.0, 22692.0, 36774.0, 58017.0, 89471.0, 127933.0, 1047659.0, 316026.0, 125412.0, 86720.0, 56909.0, 35565.0, 21751.0, 13566.0, 8385.0, 5147.0, 3148.0, 1857.0, 1184.0, 735.0, 478.0, 281.0, 180.0, 131.0, 85.0, 57.0, 32.0, 21.0, 19.0, 16.0, 11.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.58447265625, -0.5677566528320312, -0.5510406494140625, -0.5343246459960938, -0.517608642578125, -0.5008926391601562, -0.4841766357421875, -0.46746063232421875, -0.45074462890625, -0.43402862548828125, -0.4173126220703125, -0.40059661865234375, -0.383880615234375, -0.36716461181640625, -0.3504486083984375, -0.33373260498046875, -0.3170166015625, -0.30030059814453125, -0.2835845947265625, -0.26686859130859375, -0.250152587890625, -0.23343658447265625, -0.2167205810546875, -0.20000457763671875, -0.18328857421875, -0.16657257080078125, -0.1498565673828125, -0.13314056396484375, -0.116424560546875, -0.09970855712890625, -0.0829925537109375, -0.06627655029296875, -0.049560546875, -0.03284454345703125, -0.0161285400390625, 0.00058746337890625, 0.017303466796875, 0.03401947021484375, 0.0507354736328125, 0.06745147705078125, 0.08416748046875, 0.10088348388671875, 0.1175994873046875, 0.13431549072265625, 0.151031494140625, 0.16774749755859375, 0.1844635009765625, 0.20117950439453125, 0.2178955078125, 0.23461151123046875, 0.2513275146484375, 0.26804351806640625, 0.284759521484375, 0.30147552490234375, 0.3181915283203125, 0.33490753173828125, 0.35162353515625, 0.36833953857421875, 0.3850555419921875, 0.40177154541015625, 0.418487548828125, 0.43520355224609375, 0.4519195556640625, 0.46863555908203125, 0.4853515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 16.0, 14.0, 27.0, 25.0, 36.0, 47.0, 54.0, 63.0, 60.0, 65.0, 74.0, 78.0, 80.0, 44.0, 53.0, 41.0, 47.0, 39.0, 22.0, 18.0, 13.0, 24.0, 11.0, 2.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0037250518798828125, -0.0035968124866485596, -0.0034685730934143066, -0.0033403337001800537, -0.0032120943069458008, -0.003083854913711548, -0.002955615520477295, -0.002827376127243042, -0.002699136734008789, -0.002570897340774536, -0.002442657947540283, -0.0023144185543060303, -0.0021861791610717773, -0.0020579397678375244, -0.0019297003746032715, -0.0018014609813690186, -0.0016732215881347656, -0.0015449821949005127, -0.0014167428016662598, -0.0012885034084320068, -0.001160264015197754, -0.001032024621963501, -0.000903785228729248, -0.0007755458354949951, -0.0006473064422607422, -0.0005190670490264893, -0.00039082765579223633, -0.0002625882625579834, -0.00013434886932373047, -6.109476089477539e-06, 0.0001221299171447754, 0.0002503693103790283, 0.00037860870361328125, 0.0005068480968475342, 0.0006350874900817871, 0.00076332688331604, 0.000891566276550293, 0.001019805669784546, 0.0011480450630187988, 0.0012762844562530518, 0.0014045238494873047, 0.0015327632427215576, 0.0016610026359558105, 0.0017892420291900635, 0.0019174814224243164, 0.0020457208156585693, 0.0021739602088928223, 0.002302199602127075, 0.002430438995361328, 0.002558678388595581, 0.002686917781829834, 0.002815157175064087, 0.00294339656829834, 0.0030716359615325928, 0.0031998753547668457, 0.0033281147480010986, 0.0034563541412353516, 0.0035845935344696045, 0.0037128329277038574, 0.0038410723209381104, 0.003969311714172363, 0.004097551107406616, 0.004225790500640869, 0.004354029893875122, 0.004482269287109375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 7.0, 18.0, 25.0, 36.0, 25.0, 56.0, 76.0, 115.0, 183.0, 351.0, 3169.0, 955740.0, 87006.0, 978.0, 267.0, 156.0, 108.0, 69.0, 45.0, 31.0, 30.0, 16.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.1115407943725586, -0.10833549499511719, -0.10513019561767578, -0.10192489624023438, -0.09871959686279297, -0.09551429748535156, -0.09230899810791016, -0.08910369873046875, -0.08589839935302734, -0.08269309997558594, -0.07948780059814453, -0.07628250122070312, -0.07307720184326172, -0.06987190246582031, -0.0666666030883789, -0.0634613037109375, -0.060256004333496094, -0.05705070495605469, -0.05384540557861328, -0.050640106201171875, -0.04743480682373047, -0.04422950744628906, -0.041024208068847656, -0.03781890869140625, -0.034613609313964844, -0.03140830993652344, -0.02820301055908203, -0.024997711181640625, -0.02179241180419922, -0.018587112426757812, -0.015381813049316406, -0.012176513671875, -0.008971214294433594, -0.0057659149169921875, -0.0025606155395507812, 0.000644683837890625, 0.0038499832153320312, 0.0070552825927734375, 0.010260581970214844, 0.01346588134765625, 0.016671180725097656, 0.019876480102539062, 0.02308177947998047, 0.026287078857421875, 0.02949237823486328, 0.03269767761230469, 0.035902976989746094, 0.0391082763671875, 0.042313575744628906, 0.04551887512207031, 0.04872417449951172, 0.051929473876953125, 0.05513477325439453, 0.05834007263183594, 0.061545372009277344, 0.06475067138671875, 0.06795597076416016, 0.07116127014160156, 0.07436656951904297, 0.07757186889648438, 0.08077716827392578, 0.08398246765136719, 0.0871877670288086, 0.09039306640625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 180.0, 805.0, 29.0, 4.0], "bins": [-0.06408385932445526, -0.06303854286670685, -0.061993226408958435, -0.06094790995121002, -0.05990259349346161, -0.058857280761003494, -0.05781196430325508, -0.05676664784550667, -0.055721331387758255, -0.05467601493000984, -0.05363069847226143, -0.052585382014513016, -0.0515400692820549, -0.05049475282430649, -0.049449436366558075, -0.04840411990880966, -0.04735880345106125, -0.046313486993312836, -0.04526817053556442, -0.04422285407781601, -0.043177537620067596, -0.04213222488760948, -0.04108690842986107, -0.040041591972112656, -0.03899627551436424, -0.03795095905661583, -0.036905642598867416, -0.035860326141119, -0.03481501340866089, -0.033769696950912476, -0.03272438049316406, -0.03167906403541565, -0.030633747577667236, -0.029588431119918823, -0.02854311466217041, -0.027497800067067146, -0.026452483609318733, -0.02540716715157032, -0.024361852556467056, -0.023316536098718643, -0.02227121964097023, -0.021225903183221817, -0.020180586725473404, -0.01913527213037014, -0.018089955672621727, -0.017044639214873314, -0.01599932461977005, -0.014954008162021637, -0.01390869077295065, -0.01286337524652481, -0.011818058788776398, -0.010772742331027985, -0.009727426804602146, -0.008682111278176308, -0.007636794820427895, -0.006591478828340769, -0.005546162836253643, -0.004500846844166517, -0.0034555308520793915, -0.0024102148599922657, -0.00136489886790514, -0.00031958287581801414, 0.0007257331162691116, 0.0017710491083562374, 0.0028163648676127195]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 7.0, 14.0, 16.0, 10.0, 20.0, 23.0, 30.0, 30.0, 40.0, 43.0, 39.0, 46.0, 52.0, 52.0, 73.0, 50.0, 55.0, 41.0, 35.0, 49.0, 40.0, 40.0, 31.0, 35.0, 22.0, 18.0, 14.0, 11.0, 13.0, 12.0, 3.0, 4.0, 8.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001860976219177246, -0.0017893752083182335, -0.0017177741974592209, -0.0016461731866002083, -0.0015745721757411957, -0.001502971164882183, -0.0014313701540231705, -0.0013597691431641579, -0.0012881681323051453, -0.0012165671214461327, -0.00114496611058712, -0.0010733650997281075, -0.0010017640888690948, -0.0009301630780100822, -0.0008585620671510696, -0.000786961056292057, -0.0007153600454330444, -0.0006437590345740318, -0.0005721580237150192, -0.0005005570128560066, -0.000428956001996994, -0.0003573549911379814, -0.0002857539802789688, -0.0002141529694199562, -0.0001425519585609436, -7.0950947701931e-05, 6.50063157081604e-07, 7.225107401609421e-05, 0.0001438520848751068, 0.00021545309573411942, 0.000287054106593132, 0.0003586551174521446, 0.0004302561283111572, 0.0005018571391701698, 0.0005734581500291824, 0.000645059160888195, 0.0007166601717472076, 0.0007882611826062202, 0.0008598621934652328, 0.0009314632043242455, 0.001003064215183258, 0.0010746652260422707, 0.0011462662369012833, 0.0012178672477602959, 0.0012894682586193085, 0.001361069269478321, 0.0014326702803373337, 0.0015042712911963463, 0.0015758723020553589, 0.0016474733129143715, 0.001719074323773384, 0.0017906753346323967, 0.0018622763454914093, 0.001933877356350422, 0.0020054783672094345, 0.002077079378068447, 0.0021486803889274597, 0.0022202813997864723, 0.002291882410645485, 0.0023634834215044975, 0.00243508443236351, 0.0025066854432225227, 0.0025782864540815353, 0.002649887464940548, 0.0027214884757995605]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 6.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 16.0, 19.0, 18.0, 25.0, 30.0, 26.0, 35.0, 34.0, 36.0, 38.0, 37.0, 45.0, 43.0, 41.0, 45.0, 39.0, 63.0, 40.0, 46.0, 32.0, 23.0, 26.0, 24.0, 29.0, 19.0, 15.0, 16.0, 12.0, 8.0, 9.0, 7.0, 12.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.53515625, -6.3214111328125, -6.107666015625, -5.8939208984375, -5.68017578125, -5.4664306640625, -5.252685546875, -5.0389404296875, -4.8251953125, -4.6114501953125, -4.397705078125, -4.1839599609375, -3.97021484375, -3.7564697265625, -3.542724609375, -3.3289794921875, -3.115234375, -2.9014892578125, -2.687744140625, -2.4739990234375, -2.26025390625, -2.0465087890625, -1.832763671875, -1.6190185546875, -1.4052734375, -1.1915283203125, -0.977783203125, -0.7640380859375, -0.55029296875, -0.3365478515625, -0.122802734375, 0.0909423828125, 0.3046875, 0.5184326171875, 0.732177734375, 0.9459228515625, 1.15966796875, 1.3734130859375, 1.587158203125, 1.8009033203125, 2.0146484375, 2.2283935546875, 2.442138671875, 2.6558837890625, 2.86962890625, 3.0833740234375, 3.297119140625, 3.5108642578125, 3.724609375, 3.9383544921875, 4.152099609375, 4.3658447265625, 4.57958984375, 4.7933349609375, 5.007080078125, 5.2208251953125, 5.4345703125, 5.6483154296875, 5.862060546875, 6.0758056640625, 6.28955078125, 6.5032958984375, 6.717041015625, 6.9307861328125, 7.14453125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 10.0, 17.0, 23.0, 35.0, 31.0, 61.0, 107.0, 158.0, 281.0, 513.0, 916.0, 1770.0, 3797.0, 7901.0, 17252.0, 39542.0, 98640.0, 309182.0, 369647.0, 115727.0, 45733.0, 19661.0, 8954.0, 4176.0, 2034.0, 986.0, 553.0, 294.0, 182.0, 110.0, 67.0, 44.0, 37.0, 12.0, 15.0, 15.0, 15.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.05859375, -5.857177734375, -5.65576171875, -5.454345703125, -5.2529296875, -5.051513671875, -4.85009765625, -4.648681640625, -4.447265625, -4.245849609375, -4.04443359375, -3.843017578125, -3.6416015625, -3.440185546875, -3.23876953125, -3.037353515625, -2.8359375, -2.634521484375, -2.43310546875, -2.231689453125, -2.0302734375, -1.828857421875, -1.62744140625, -1.426025390625, -1.224609375, -1.023193359375, -0.82177734375, -0.620361328125, -0.4189453125, -0.217529296875, -0.01611328125, 0.185302734375, 0.38671875, 0.588134765625, 0.78955078125, 0.990966796875, 1.1923828125, 1.393798828125, 1.59521484375, 1.796630859375, 1.998046875, 2.199462890625, 2.40087890625, 2.602294921875, 2.8037109375, 3.005126953125, 3.20654296875, 3.407958984375, 3.609375, 3.810791015625, 4.01220703125, 4.213623046875, 4.4150390625, 4.616455078125, 4.81787109375, 5.019287109375, 5.220703125, 5.422119140625, 5.62353515625, 5.824951171875, 6.0263671875, 6.227783203125, 6.42919921875, 6.630615234375, 6.83203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 6.0, 4.0, 13.0, 17.0, 22.0, 18.0, 23.0, 24.0, 30.0, 27.0, 33.0, 39.0, 40.0, 47.0, 50.0, 75.0, 246.0, 1605.0, 190.0, 83.0, 53.0, 43.0, 47.0, 44.0, 39.0, 28.0, 33.0, 26.0, 20.0, 23.0, 18.0, 14.0, 6.0, 16.0, 6.0, 8.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-23.078125, -22.40673828125, -21.7353515625, -21.06396484375, -20.392578125, -19.72119140625, -19.0498046875, -18.37841796875, -17.70703125, -17.03564453125, -16.3642578125, -15.69287109375, -15.021484375, -14.35009765625, -13.6787109375, -13.00732421875, -12.3359375, -11.66455078125, -10.9931640625, -10.32177734375, -9.650390625, -8.97900390625, -8.3076171875, -7.63623046875, -6.96484375, -6.29345703125, -5.6220703125, -4.95068359375, -4.279296875, -3.60791015625, -2.9365234375, -2.26513671875, -1.59375, -0.92236328125, -0.2509765625, 0.42041015625, 1.091796875, 1.76318359375, 2.4345703125, 3.10595703125, 3.77734375, 4.44873046875, 5.1201171875, 5.79150390625, 6.462890625, 7.13427734375, 7.8056640625, 8.47705078125, 9.1484375, 9.81982421875, 10.4912109375, 11.16259765625, 11.833984375, 12.50537109375, 13.1767578125, 13.84814453125, 14.51953125, 15.19091796875, 15.8623046875, 16.53369140625, 17.205078125, 17.87646484375, 18.5478515625, 19.21923828125, 19.890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 12.0, 11.0, 9.0, 10.0, 14.0, 15.0, 28.0, 27.0, 28.0, 48.0, 46.0, 88.0, 87.0, 145.0, 170.0, 193.0, 348.0, 631.0, 2735.0, 78505.0, 3007643.0, 50891.0, 2279.0, 578.0, 311.0, 201.0, 149.0, 124.0, 63.0, 62.0, 53.0, 40.0, 31.0, 29.0, 28.0, 12.0, 7.0, 10.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.0, -31.87939453125, -30.7587890625, -29.63818359375, -28.517578125, -27.39697265625, -26.2763671875, -25.15576171875, -24.03515625, -22.91455078125, -21.7939453125, -20.67333984375, -19.552734375, -18.43212890625, -17.3115234375, -16.19091796875, -15.0703125, -13.94970703125, -12.8291015625, -11.70849609375, -10.587890625, -9.46728515625, -8.3466796875, -7.22607421875, -6.10546875, -4.98486328125, -3.8642578125, -2.74365234375, -1.623046875, -0.50244140625, 0.6181640625, 1.73876953125, 2.859375, 3.97998046875, 5.1005859375, 6.22119140625, 7.341796875, 8.46240234375, 9.5830078125, 10.70361328125, 11.82421875, 12.94482421875, 14.0654296875, 15.18603515625, 16.306640625, 17.42724609375, 18.5478515625, 19.66845703125, 20.7890625, 21.90966796875, 23.0302734375, 24.15087890625, 25.271484375, 26.39208984375, 27.5126953125, 28.63330078125, 29.75390625, 30.87451171875, 31.9951171875, 33.11572265625, 34.236328125, 35.35693359375, 36.4775390625, 37.59814453125, 38.71875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 171.0, 722.0, 119.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.3849792480469, -263.5423583984375, -258.6997375488281, -253.8571014404297, -249.01446533203125, -244.17184448242188, -239.32920837402344, -234.48658752441406, -229.64395141601562, -224.80133056640625, -219.9586944580078, -215.11607360839844, -210.2734375, -205.43081665039062, -200.5881805419922, -195.7455596923828, -190.90293884277344, -186.06031799316406, -181.21768188476562, -176.37506103515625, -171.5324249267578, -166.68980407714844, -161.84716796875, -157.00454711914062, -152.16192626953125, -147.31930541992188, -142.47666931152344, -137.63404846191406, -132.79141235351562, -127.94879150390625, -123.10616302490234, -118.26353454589844, -113.42090606689453, -108.57827758789062, -103.73564910888672, -98.89302062988281, -94.05039978027344, -89.207763671875, -84.36514282226562, -79.52251434326172, -74.67988586425781, -69.8372573852539, -64.99462890625, -60.15200424194336, -55.30937576293945, -50.46674728393555, -45.624122619628906, -40.781494140625, -35.938865661621094, -31.096237182617188, -26.253610610961914, -21.41098403930664, -16.568355560302734, -11.725727081298828, -6.883100509643555, -2.0404739379882812, 2.802154541015625, 7.644782066345215, 12.487409591674805, 17.330036163330078, 22.172664642333984, 27.01529312133789, 31.857919692993164, 36.70054626464844, 41.543174743652344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 10.0, 10.0, 11.0, 5.0, 11.0, 12.0, 19.0, 21.0, 16.0, 18.0, 25.0, 29.0, 37.0, 20.0, 35.0, 33.0, 33.0, 34.0, 48.0, 36.0, 41.0, 43.0, 33.0, 36.0, 41.0, 38.0, 30.0, 34.0, 22.0, 21.0, 32.0, 22.0, 13.0, 22.0, 14.0, 14.0, 10.0, 12.0, 11.0, 14.0, 15.0, 7.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.861915588378906, -49.33371353149414, -47.80550765991211, -46.277305603027344, -44.74910354614258, -43.22089767456055, -41.69269561767578, -40.16448974609375, -38.636287689208984, -37.10808563232422, -35.57987976074219, -34.05167770385742, -32.523475646972656, -30.995269775390625, -29.46706771850586, -27.93886375427246, -26.410661697387695, -24.882457733154297, -23.35425567626953, -21.826051712036133, -20.297847747802734, -18.76964569091797, -17.24144172668457, -15.713237762451172, -14.18503475189209, -12.656831741333008, -11.12862777709961, -9.600424766540527, -8.072221755981445, -6.544017791748047, -5.015814781188965, -3.4876108169555664, -1.9594078063964844, -0.4312044382095337, 1.096998929977417, 2.625202178955078, 4.153405666351318, 5.681609153747559, 7.209812164306641, 8.738016128540039, 10.266219139099121, 11.794422149658203, 13.322626113891602, 14.850829124450684, 16.379032135009766, 17.907236099243164, 19.435440063476562, 20.963642120361328, 22.491846084594727, 24.020050048828125, 25.54825210571289, 27.07645606994629, 28.604660034179688, 30.132862091064453, 31.66106605529785, 33.18927001953125, 34.717472076416016, 36.24567413330078, 37.77388000488281, 39.30208206176758, 40.830284118652344, 42.358489990234375, 43.88669204711914, 45.414894104003906, 46.94309997558594]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 5.0, 9.0, 3.0, 9.0, 5.0, 9.0, 18.0, 8.0, 17.0, 25.0, 24.0, 22.0, 23.0, 30.0, 30.0, 45.0, 36.0, 35.0, 52.0, 41.0, 47.0, 45.0, 50.0, 34.0, 40.0, 39.0, 31.0, 33.0, 29.0, 25.0, 34.0, 16.0, 17.0, 15.0, 15.0, 11.0, 10.0, 9.0, 8.0, 7.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.47265625, -6.2568359375, -6.041015625, -5.8251953125, -5.609375, -5.3935546875, -5.177734375, -4.9619140625, -4.74609375, -4.5302734375, -4.314453125, -4.0986328125, -3.8828125, -3.6669921875, -3.451171875, -3.2353515625, -3.01953125, -2.8037109375, -2.587890625, -2.3720703125, -2.15625, -1.9404296875, -1.724609375, -1.5087890625, -1.29296875, -1.0771484375, -0.861328125, -0.6455078125, -0.4296875, -0.2138671875, 0.001953125, 0.2177734375, 0.43359375, 0.6494140625, 0.865234375, 1.0810546875, 1.296875, 1.5126953125, 1.728515625, 1.9443359375, 2.16015625, 2.3759765625, 2.591796875, 2.8076171875, 3.0234375, 3.2392578125, 3.455078125, 3.6708984375, 3.88671875, 4.1025390625, 4.318359375, 4.5341796875, 4.75, 4.9658203125, 5.181640625, 5.3974609375, 5.61328125, 5.8291015625, 6.044921875, 6.2607421875, 6.4765625, 6.6923828125, 6.908203125, 7.1240234375, 7.33984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 8.0, 7.0, 15.0, 15.0, 21.0, 24.0, 18.0, 35.0, 41.0, 47.0, 79.0, 129.0, 274.0, 619.0, 1559.0, 6461.0, 37763.0, 524763.0, 3077826.0, 499595.0, 35799.0, 6166.0, 1636.0, 615.0, 252.0, 138.0, 91.0, 38.0, 36.0, 44.0, 27.0, 24.0, 18.0, 18.0, 11.0, 8.0, 10.0, 2.0, 7.0, 4.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.133056640625, -16.53173828125, -15.930419921875, -15.3291015625, -14.727783203125, -14.12646484375, -13.525146484375, -12.923828125, -12.322509765625, -11.72119140625, -11.119873046875, -10.5185546875, -9.917236328125, -9.31591796875, -8.714599609375, -8.11328125, -7.511962890625, -6.91064453125, -6.309326171875, -5.7080078125, -5.106689453125, -4.50537109375, -3.904052734375, -3.302734375, -2.701416015625, -2.10009765625, -1.498779296875, -0.8974609375, -0.296142578125, 0.30517578125, 0.906494140625, 1.5078125, 2.109130859375, 2.71044921875, 3.311767578125, 3.9130859375, 4.514404296875, 5.11572265625, 5.717041015625, 6.318359375, 6.919677734375, 7.52099609375, 8.122314453125, 8.7236328125, 9.324951171875, 9.92626953125, 10.527587890625, 11.12890625, 11.730224609375, 12.33154296875, 12.932861328125, 13.5341796875, 14.135498046875, 14.73681640625, 15.338134765625, 15.939453125, 16.540771484375, 17.14208984375, 17.743408203125, 18.3447265625, 18.946044921875, 19.54736328125, 20.148681640625, 20.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 11.0, 10.0, 13.0, 18.0, 23.0, 24.0, 31.0, 47.0, 67.0, 78.0, 88.0, 122.0, 163.0, 206.0, 272.0, 287.0, 380.0, 397.0, 346.0, 339.0, 269.0, 180.0, 138.0, 114.0, 76.0, 67.0, 69.0, 44.0, 42.0, 29.0, 28.0, 19.0, 15.0, 7.0, 10.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5361328125, -9.212890625, -8.8896484375, -8.56640625, -8.2431640625, -7.919921875, -7.5966796875, -7.2734375, -6.9501953125, -6.626953125, -6.3037109375, -5.98046875, -5.6572265625, -5.333984375, -5.0107421875, -4.6875, -4.3642578125, -4.041015625, -3.7177734375, -3.39453125, -3.0712890625, -2.748046875, -2.4248046875, -2.1015625, -1.7783203125, -1.455078125, -1.1318359375, -0.80859375, -0.4853515625, -0.162109375, 0.1611328125, 0.484375, 0.8076171875, 1.130859375, 1.4541015625, 1.77734375, 2.1005859375, 2.423828125, 2.7470703125, 3.0703125, 3.3935546875, 3.716796875, 4.0400390625, 4.36328125, 4.6865234375, 5.009765625, 5.3330078125, 5.65625, 5.9794921875, 6.302734375, 6.6259765625, 6.94921875, 7.2724609375, 7.595703125, 7.9189453125, 8.2421875, 8.5654296875, 8.888671875, 9.2119140625, 9.53515625, 9.8583984375, 10.181640625, 10.5048828125, 10.828125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 9.0, 8.0, 11.0, 15.0, 14.0, 38.0, 44.0, 70.0, 79.0, 105.0, 143.0, 176.0, 265.0, 354.0, 1115.0, 13381.0, 2391994.0, 1772393.0, 11662.0, 983.0, 379.0, 296.0, 178.0, 147.0, 105.0, 75.0, 64.0, 53.0, 34.0, 22.0, 17.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.75, -61.005859375, -59.26171875, -57.517578125, -55.7734375, -54.029296875, -52.28515625, -50.541015625, -48.796875, -47.052734375, -45.30859375, -43.564453125, -41.8203125, -40.076171875, -38.33203125, -36.587890625, -34.84375, -33.099609375, -31.35546875, -29.611328125, -27.8671875, -26.123046875, -24.37890625, -22.634765625, -20.890625, -19.146484375, -17.40234375, -15.658203125, -13.9140625, -12.169921875, -10.42578125, -8.681640625, -6.9375, -5.193359375, -3.44921875, -1.705078125, 0.0390625, 1.783203125, 3.52734375, 5.271484375, 7.015625, 8.759765625, 10.50390625, 12.248046875, 13.9921875, 15.736328125, 17.48046875, 19.224609375, 20.96875, 22.712890625, 24.45703125, 26.201171875, 27.9453125, 29.689453125, 31.43359375, 33.177734375, 34.921875, 36.666015625, 38.41015625, 40.154296875, 41.8984375, 43.642578125, 45.38671875, 47.130859375, 48.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 210.0, 500.0, 243.0, 37.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-323.2208557128906, -316.421630859375, -309.6224060058594, -302.82318115234375, -296.02398681640625, -289.2247619628906, -282.425537109375, -275.6263122558594, -268.82708740234375, -262.0278625488281, -255.22865295410156, -248.42942810058594, -241.6302032470703, -234.83099365234375, -228.03176879882812, -221.2325439453125, -214.433349609375, -207.63412475585938, -200.8349151611328, -194.0356903076172, -187.23646545410156, -180.437255859375, -173.63803100585938, -166.83880615234375, -160.03958129882812, -153.2403564453125, -146.44114685058594, -139.6419219970703, -132.8426971435547, -126.04348754882812, -119.2442626953125, -112.4450454711914, -105.64582061767578, -98.84660339355469, -92.04737854003906, -85.24816131591797, -78.44894409179688, -71.64971923828125, -64.85050201416016, -58.05128479003906, -51.2520637512207, -44.452842712402344, -37.65362548828125, -30.85440444946289, -24.055185317993164, -17.255966186523438, -10.456745147705078, -3.6575279235839844, 3.141693115234375, 9.940912246704102, 16.740131378173828, 23.539352416992188, 30.338571548461914, 37.13779067993164, 43.93701171875, 50.736228942871094, 57.53544998168945, 64.33467102050781, 71.1338882446289, 77.93310546875, 84.73233032226562, 91.53154754638672, 98.33076477050781, 105.12998962402344, 111.92920684814453]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 7.0, 7.0, 15.0, 14.0, 11.0, 21.0, 20.0, 23.0, 23.0, 33.0, 31.0, 34.0, 31.0, 39.0, 26.0, 33.0, 33.0, 32.0, 45.0, 37.0, 54.0, 38.0, 48.0, 35.0, 21.0, 31.0, 37.0, 28.0, 29.0, 20.0, 25.0, 20.0, 17.0, 20.0, 9.0, 6.0, 5.0, 7.0, 4.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.93975830078125, -38.61375427246094, -37.287750244140625, -35.96174621582031, -34.6357421875, -33.30973434448242, -31.98373031616211, -30.657726287841797, -29.331722259521484, -28.005718231201172, -26.67971420288086, -25.353708267211914, -24.0277042388916, -22.70170021057129, -21.375694274902344, -20.04969024658203, -18.72368621826172, -17.397682189941406, -16.071678161621094, -14.745672225952148, -13.419668197631836, -12.093664169311523, -10.767659187316895, -9.441654205322266, -8.115650177001953, -6.789645671844482, -5.463641166687012, -4.137636661529541, -2.8116321563720703, -1.4856276512145996, -0.1596231460571289, 1.1663818359375, 2.4923858642578125, 3.818390369415283, 5.144394874572754, 6.470399379730225, 7.796403884887695, 9.122407913208008, 10.448412895202637, 11.774417877197266, 13.100421905517578, 14.42642593383789, 15.75243091583252, 17.07843589782715, 18.40443992614746, 19.730443954467773, 21.05644989013672, 22.38245391845703, 23.708457946777344, 25.034461975097656, 26.36046600341797, 27.686471939086914, 29.012475967407227, 30.33847999572754, 31.664485931396484, 32.9904899597168, 34.31649398803711, 35.64249801635742, 36.968502044677734, 38.29450607299805, 39.620513916015625, 40.94651794433594, 42.27252197265625, 43.59852600097656, 44.924530029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 42.0, 37.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 7.0, 19.0, 20.0, 29.0, 47.0, 75.0, 97.0, 160.0, 221.0, 346.0, 565.0, 846.0, 1405.0, 2005.0, 3142.0, 4988.0, 7669.0, 11979.0, 18687.0, 29086.0, 45537.0, 71464.0, 109937.0, 154187.0, 173919.0, 141053.0, 97030.0, 62404.0, 40440.0, 25604.0, 16204.0, 10365.0, 6839.0, 4295.0, 2744.0, 1812.0, 1166.0, 739.0, 496.0, 315.0, 197.0, 147.0, 89.0, 64.0, 30.0, 28.0, 13.0, 16.0, 5.0, 9.0, 6.0, 8.0], "bins": [-0.76904296875, -0.7478866577148438, -0.7267303466796875, -0.7055740356445312, -0.684417724609375, -0.6632614135742188, -0.6421051025390625, -0.6209487915039062, -0.59979248046875, -0.5786361694335938, -0.5574798583984375, -0.5363235473632812, -0.515167236328125, -0.49401092529296875, -0.4728546142578125, -0.45169830322265625, -0.4305419921875, -0.40938568115234375, -0.3882293701171875, -0.36707305908203125, -0.345916748046875, -0.32476043701171875, -0.3036041259765625, -0.28244781494140625, -0.26129150390625, -0.24013519287109375, -0.2189788818359375, -0.19782257080078125, -0.176666259765625, -0.15550994873046875, -0.1343536376953125, -0.11319732666015625, -0.092041015625, -0.07088470458984375, -0.0497283935546875, -0.02857208251953125, -0.007415771484375, 0.01374053955078125, 0.0348968505859375, 0.05605316162109375, 0.07720947265625, 0.09836578369140625, 0.1195220947265625, 0.14067840576171875, 0.161834716796875, 0.18299102783203125, 0.2041473388671875, 0.22530364990234375, 0.2464599609375, 0.26761627197265625, 0.2887725830078125, 0.30992889404296875, 0.331085205078125, 0.35224151611328125, 0.3733978271484375, 0.39455413818359375, 0.41571044921875, 0.43686676025390625, 0.4580230712890625, 0.47917938232421875, 0.500335693359375, 0.5214920043945312, 0.5426483154296875, 0.5638046264648438, 0.5849609375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 3.0, 10.0, 6.0, 8.0, 11.0, 12.0, 17.0, 17.0, 26.0, 26.0, 20.0, 39.0, 31.0, 37.0, 36.0, 46.0, 37.0, 43.0, 34.0, 41.0, 1064.0, 47.0, 42.0, 39.0, 45.0, 34.0, 30.0, 30.0, 30.0, 21.0, 12.0, 23.0, 15.0, 19.0, 14.0, 16.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.864013671875, -4.71240234375, -4.560791015625, -4.4091796875, -4.257568359375, -4.10595703125, -3.954345703125, -3.802734375, -3.651123046875, -3.49951171875, -3.347900390625, -3.1962890625, -3.044677734375, -2.89306640625, -2.741455078125, -2.58984375, -2.438232421875, -2.28662109375, -2.135009765625, -1.9833984375, -1.831787109375, -1.68017578125, -1.528564453125, -1.376953125, -1.225341796875, -1.07373046875, -0.922119140625, -0.7705078125, -0.618896484375, -0.46728515625, -0.315673828125, -0.1640625, -0.012451171875, 0.13916015625, 0.290771484375, 0.4423828125, 0.593994140625, 0.74560546875, 0.897216796875, 1.048828125, 1.200439453125, 1.35205078125, 1.503662109375, 1.6552734375, 1.806884765625, 1.95849609375, 2.110107421875, 2.26171875, 2.413330078125, 2.56494140625, 2.716552734375, 2.8681640625, 3.019775390625, 3.17138671875, 3.322998046875, 3.474609375, 3.626220703125, 3.77783203125, 3.929443359375, 4.0810546875, 4.232666015625, 4.38427734375, 4.535888671875, 4.6875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 9.0, 16.0, 36.0, 44.0, 78.0, 128.0, 196.0, 337.0, 638.0, 1046.0, 1929.0, 3436.0, 5730.0, 9936.0, 16706.0, 29097.0, 48792.0, 80270.0, 126686.0, 184959.0, 1219194.0, 140062.0, 92006.0, 56130.0, 33060.0, 19352.0, 11491.0, 6638.0, 3877.0, 2155.0, 1279.0, 766.0, 448.0, 214.0, 164.0, 94.0, 54.0, 31.0, 21.0, 9.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5530929565429688, -0.5334320068359375, -0.5137710571289062, -0.494110107421875, -0.47444915771484375, -0.4547882080078125, -0.43512725830078125, -0.41546630859375, -0.39580535888671875, -0.3761444091796875, -0.35648345947265625, -0.336822509765625, -0.31716156005859375, -0.2975006103515625, -0.27783966064453125, -0.2581787109375, -0.23851776123046875, -0.2188568115234375, -0.19919586181640625, -0.179534912109375, -0.15987396240234375, -0.1402130126953125, -0.12055206298828125, -0.10089111328125, -0.08123016357421875, -0.0615692138671875, -0.04190826416015625, -0.022247314453125, -0.00258636474609375, 0.0170745849609375, 0.03673553466796875, 0.056396484375, 0.07605743408203125, 0.0957183837890625, 0.11537933349609375, 0.135040283203125, 0.15470123291015625, 0.1743621826171875, 0.19402313232421875, 0.21368408203125, 0.23334503173828125, 0.2530059814453125, 0.27266693115234375, 0.292327880859375, 0.31198883056640625, 0.3316497802734375, 0.35131072998046875, 0.3709716796875, 0.39063262939453125, 0.4102935791015625, 0.42995452880859375, 0.449615478515625, 0.46927642822265625, 0.4889373779296875, 0.5085983276367188, 0.52825927734375, 0.5479202270507812, 0.5675811767578125, 0.5872421264648438, 0.606903076171875, 0.6265640258789062, 0.6462249755859375, 0.6658859252929688, 0.685546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 4.0, 20.0, 18.0, 24.0, 23.0, 43.0, 47.0, 66.0, 61.0, 60.0, 85.0, 109.0, 88.0, 61.0, 71.0, 40.0, 31.0, 29.0, 33.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0063018798828125, -0.006111621856689453, -0.005921363830566406, -0.005731105804443359, -0.0055408477783203125, -0.005350589752197266, -0.005160331726074219, -0.004970073699951172, -0.004779815673828125, -0.004589557647705078, -0.004399299621582031, -0.004209041595458984, -0.0040187835693359375, -0.0038285255432128906, -0.0036382675170898438, -0.003448009490966797, -0.00325775146484375, -0.003067493438720703, -0.0028772354125976562, -0.0026869773864746094, -0.0024967193603515625, -0.0023064613342285156, -0.0021162033081054688, -0.0019259452819824219, -0.001735687255859375, -0.0015454292297363281, -0.0013551712036132812, -0.0011649131774902344, -0.0009746551513671875, -0.0007843971252441406, -0.0005941390991210938, -0.0004038810729980469, -0.000213623046875, -2.3365020751953125e-05, 0.00016689300537109375, 0.0003571510314941406, 0.0005474090576171875, 0.0007376670837402344, 0.0009279251098632812, 0.0011181831359863281, 0.001308441162109375, 0.0014986991882324219, 0.0016889572143554688, 0.0018792152404785156, 0.0020694732666015625, 0.0022597312927246094, 0.0024499893188476562, 0.002640247344970703, 0.00283050537109375, 0.003020763397216797, 0.0032110214233398438, 0.0034012794494628906, 0.0035915374755859375, 0.0037817955017089844, 0.003972053527832031, 0.004162311553955078, 0.004352569580078125, 0.004542827606201172, 0.004733085632324219, 0.004923343658447266, 0.0051136016845703125, 0.005303859710693359, 0.005494117736816406, 0.005684375762939453, 0.0058746337890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 3.0, 12.0, 13.0, 16.0, 28.0, 46.0, 56.0, 60.0, 89.0, 178.0, 323.0, 939.0, 416175.0, 628706.0, 983.0, 339.0, 164.0, 120.0, 83.0, 59.0, 38.0, 23.0, 24.0, 14.0, 10.0, 5.0, 4.0, 4.0, 7.0, 6.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1258544921875, -0.12179756164550781, -0.11774063110351562, -0.11368370056152344, -0.10962677001953125, -0.10556983947753906, -0.10151290893554688, -0.09745597839355469, -0.0933990478515625, -0.08934211730957031, -0.08528518676757812, -0.08122825622558594, -0.07717132568359375, -0.07311439514160156, -0.06905746459960938, -0.06500053405761719, -0.060943603515625, -0.05688667297363281, -0.052829742431640625, -0.04877281188964844, -0.04471588134765625, -0.04065895080566406, -0.036602020263671875, -0.03254508972167969, -0.0284881591796875, -0.024431228637695312, -0.020374298095703125, -0.016317367553710938, -0.01226043701171875, -0.008203506469726562, -0.004146575927734375, -8.96453857421875e-05, 0.00396728515625, 0.008024215698242188, 0.012081146240234375, 0.016138076782226562, 0.02019500732421875, 0.024251937866210938, 0.028308868408203125, 0.03236579895019531, 0.0364227294921875, 0.04047966003417969, 0.044536590576171875, 0.04859352111816406, 0.05265045166015625, 0.05670738220214844, 0.060764312744140625, 0.06482124328613281, 0.068878173828125, 0.07293510437011719, 0.07699203491210938, 0.08104896545410156, 0.08510589599609375, 0.08916282653808594, 0.09321975708007812, 0.09727668762207031, 0.1013336181640625, 0.10539054870605469, 0.10944747924804688, 0.11350440979003906, 0.11756134033203125, 0.12161827087402344, 0.12567520141601562, 0.1297321319580078, 0.1337890625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 31.0, 195.0, 519.0, 215.0, 39.0, 12.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.024682270362973213, -0.02424539066851139, -0.023808512836694717, -0.023371633142232895, -0.022934753447771072, -0.02249787375330925, -0.022060995921492577, -0.021624116227030754, -0.02118723839521408, -0.02075035870075226, -0.020313480868935585, -0.019876601174473763, -0.01943972148001194, -0.019002843648195267, -0.018565963953733444, -0.01812908425927162, -0.0176922045648098, -0.017255324870347977, -0.016818447038531303, -0.01638156734406948, -0.01594468764960766, -0.01550780888646841, -0.015070930123329163, -0.01463405042886734, -0.014197171665728092, -0.013760292902588844, -0.013323413208127022, -0.012886534444987774, -0.012449655681848526, -0.012012775987386703, -0.011575897224247456, -0.011139018461108208, -0.01070213969796896, -0.010265260934829712, -0.00982838124036789, -0.009391502477228642, -0.008954623714089394, -0.008517744019627571, -0.008080865256488323, -0.007643986027687788, -0.007207106798887253, -0.006770227570086718, -0.006333348341286182, -0.0058964695781469345, -0.005459590349346399, -0.005022711120545864, -0.004585832357406616, -0.004148953128606081, -0.003712073899805546, -0.0032751946710050106, -0.002838315675035119, -0.0024014366790652275, -0.0019645574502646923, -0.001527678221464157, -0.0010907992254942656, -0.000653920229524374, -0.0002170410007238388, 0.00021983811166137457, 0.0006567172240465879, 0.0010935963364318013, 0.0015304754488170147, 0.00196735467761755, 0.0024042336735874414, 0.002841112669557333, 0.003277991898357868]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 12.0, 20.0, 21.0, 24.0, 27.0, 24.0, 32.0, 51.0, 50.0, 50.0, 53.0, 70.0, 58.0, 60.0, 55.0, 56.0, 48.0, 40.0, 43.0, 33.0, 35.0, 26.0, 16.0, 25.0, 9.0, 10.0, 13.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003043830394744873, -0.0029310202226042747, -0.0028182100504636765, -0.002705399878323078, -0.00259258970618248, -0.0024797795340418816, -0.0023669693619012833, -0.002254159189760685, -0.0021413490176200867, -0.0020285388454794884, -0.00191572867333889, -0.0018029185011982918, -0.0016901083290576935, -0.0015772981569170952, -0.0014644879847764969, -0.0013516778126358986, -0.0012388676404953003, -0.001126057468354702, -0.0010132472962141037, -0.0009004371240735054, -0.0007876269519329071, -0.0006748167797923088, -0.0005620066076517105, -0.0004491964355111122, -0.0003363862633705139, -0.00022357609122991562, -0.00011076591908931732, 2.0442530512809753e-06, 0.00011485442519187927, 0.00022766459733247757, 0.00034047476947307587, 0.00045328494161367416, 0.0005660951137542725, 0.0006789052858948708, 0.0007917154580354691, 0.0009045256301760674, 0.0010173358023166656, 0.001130145974457264, 0.0012429561465978622, 0.0013557663187384605, 0.0014685764908790588, 0.0015813866630196571, 0.0016941968351602554, 0.0018070070073008537, 0.001919817179441452, 0.0020326273515820503, 0.0021454375237226486, 0.002258247695863247, 0.002371057868003845, 0.0024838680401444435, 0.002596678212285042, 0.00270948838442564, 0.0028222985565662384, 0.0029351087287068367, 0.003047918900847435, 0.0031607290729880333, 0.0032735392451286316, 0.00338634941726923, 0.003499159589409828, 0.0036119697615504265, 0.0037247799336910248, 0.003837590105831623, 0.003950400277972221, 0.00406321045011282, 0.004176020622253418]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 8.0, 9.0, 8.0, 11.0, 15.0, 15.0, 8.0, 15.0, 20.0, 15.0, 26.0, 28.0, 37.0, 36.0, 27.0, 41.0, 38.0, 38.0, 44.0, 57.0, 42.0, 43.0, 36.0, 49.0, 37.0, 42.0, 31.0, 29.0, 28.0, 25.0, 22.0, 23.0, 7.0, 19.0, 10.0, 10.0, 12.0, 9.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.6328125, -7.4022216796875, -7.171630859375, -6.9410400390625, -6.71044921875, -6.4798583984375, -6.249267578125, -6.0186767578125, -5.7880859375, -5.5574951171875, -5.326904296875, -5.0963134765625, -4.86572265625, -4.6351318359375, -4.404541015625, -4.1739501953125, -3.943359375, -3.7127685546875, -3.482177734375, -3.2515869140625, -3.02099609375, -2.7904052734375, -2.559814453125, -2.3292236328125, -2.0986328125, -1.8680419921875, -1.637451171875, -1.4068603515625, -1.17626953125, -0.9456787109375, -0.715087890625, -0.4844970703125, -0.25390625, -0.0233154296875, 0.207275390625, 0.4378662109375, 0.66845703125, 0.8990478515625, 1.129638671875, 1.3602294921875, 1.5908203125, 1.8214111328125, 2.052001953125, 2.2825927734375, 2.51318359375, 2.7437744140625, 2.974365234375, 3.2049560546875, 3.435546875, 3.6661376953125, 3.896728515625, 4.1273193359375, 4.35791015625, 4.5885009765625, 4.819091796875, 5.0496826171875, 5.2802734375, 5.5108642578125, 5.741455078125, 5.9720458984375, 6.20263671875, 6.4332275390625, 6.663818359375, 6.8944091796875, 7.125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 5.0, 2.0, 10.0, 11.0, 6.0, 11.0, 20.0, 21.0, 20.0, 17.0, 46.0, 51.0, 56.0, 78.0, 129.0, 190.0, 270.0, 510.0, 1322.0, 4434.0, 18351.0, 111371.0, 774742.0, 111073.0, 18458.0, 4495.0, 1354.0, 564.0, 299.0, 160.0, 111.0, 87.0, 66.0, 56.0, 30.0, 31.0, 21.0, 19.0, 12.0, 16.0, 10.0, 8.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-15.1796875, -14.7265625, -14.2734375, -13.8203125, -13.3671875, -12.9140625, -12.4609375, -12.0078125, -11.5546875, -11.1015625, -10.6484375, -10.1953125, -9.7421875, -9.2890625, -8.8359375, -8.3828125, -7.9296875, -7.4765625, -7.0234375, -6.5703125, -6.1171875, -5.6640625, -5.2109375, -4.7578125, -4.3046875, -3.8515625, -3.3984375, -2.9453125, -2.4921875, -2.0390625, -1.5859375, -1.1328125, -0.6796875, -0.2265625, 0.2265625, 0.6796875, 1.1328125, 1.5859375, 2.0390625, 2.4921875, 2.9453125, 3.3984375, 3.8515625, 4.3046875, 4.7578125, 5.2109375, 5.6640625, 6.1171875, 6.5703125, 7.0234375, 7.4765625, 7.9296875, 8.3828125, 8.8359375, 9.2890625, 9.7421875, 10.1953125, 10.6484375, 11.1015625, 11.5546875, 12.0078125, 12.4609375, 12.9140625, 13.3671875, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 4.0, 7.0, 5.0, 12.0, 14.0, 14.0, 18.0, 18.0, 23.0, 33.0, 30.0, 48.0, 41.0, 44.0, 53.0, 51.0, 79.0, 227.0, 1699.0, 158.0, 76.0, 64.0, 40.0, 36.0, 37.0, 35.0, 28.0, 23.0, 24.0, 25.0, 20.0, 9.0, 7.0, 13.0, 5.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.109375, -22.375244140625, -21.64111328125, -20.906982421875, -20.1728515625, -19.438720703125, -18.70458984375, -17.970458984375, -17.236328125, -16.502197265625, -15.76806640625, -15.033935546875, -14.2998046875, -13.565673828125, -12.83154296875, -12.097412109375, -11.36328125, -10.629150390625, -9.89501953125, -9.160888671875, -8.4267578125, -7.692626953125, -6.95849609375, -6.224365234375, -5.490234375, -4.756103515625, -4.02197265625, -3.287841796875, -2.5537109375, -1.819580078125, -1.08544921875, -0.351318359375, 0.3828125, 1.116943359375, 1.85107421875, 2.585205078125, 3.3193359375, 4.053466796875, 4.78759765625, 5.521728515625, 6.255859375, 6.989990234375, 7.72412109375, 8.458251953125, 9.1923828125, 9.926513671875, 10.66064453125, 11.394775390625, 12.12890625, 12.863037109375, 13.59716796875, 14.331298828125, 15.0654296875, 15.799560546875, 16.53369140625, 17.267822265625, 18.001953125, 18.736083984375, 19.47021484375, 20.204345703125, 20.9384765625, 21.672607421875, 22.40673828125, 23.140869140625, 23.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 10.0, 6.0, 8.0, 24.0, 28.0, 24.0, 53.0, 47.0, 55.0, 71.0, 120.0, 183.0, 371.0, 1139.0, 27149.0, 3096117.0, 18180.0, 1026.0, 374.0, 178.0, 133.0, 94.0, 62.0, 45.0, 36.0, 32.0, 22.0, 25.0, 15.0, 16.0, 7.0, 7.0, 7.0, 3.0, 5.0, 8.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -54.0625, -52.34375, -50.625, -48.90625, -47.1875, -45.46875, -43.75, -42.03125, -40.3125, -38.59375, -36.875, -35.15625, -33.4375, -31.71875, -30.0, -28.28125, -26.5625, -24.84375, -23.125, -21.40625, -19.6875, -17.96875, -16.25, -14.53125, -12.8125, -11.09375, -9.375, -7.65625, -5.9375, -4.21875, -2.5, -0.78125, 0.9375, 2.65625, 4.375, 6.09375, 7.8125, 9.53125, 11.25, 12.96875, 14.6875, 16.40625, 18.125, 19.84375, 21.5625, 23.28125, 25.0, 26.71875, 28.4375, 30.15625, 31.875, 33.59375, 35.3125, 37.03125, 38.75, 40.46875, 42.1875, 43.90625, 45.625, 47.34375, 49.0625, 50.78125, 52.5, 54.21875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 14.0, 24.0, 38.0, 64.0, 113.0, 136.0, 149.0, 166.0, 103.0, 83.0, 47.0, 32.0, 16.0, 9.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.8138370513916, -28.0267391204834, -27.239639282226562, -26.45254135131836, -25.665443420410156, -24.878345489501953, -24.091245651245117, -23.304147720336914, -22.517047882080078, -21.729949951171875, -20.94285011291504, -20.155752182006836, -19.368654251098633, -18.581554412841797, -17.794456481933594, -17.00735855102539, -16.220260620117188, -15.433161735534668, -14.646063804626465, -13.858964920043945, -13.071866989135742, -12.284768104553223, -11.497669219970703, -10.7105712890625, -9.92347240447998, -9.136373519897461, -8.349275588989258, -7.562176704406738, -6.775078296661377, -5.987979888916016, -5.200881004333496, -4.413782596588135, -3.6266841888427734, -2.839585781097412, -2.0524871349334717, -1.2653884887695312, -0.4782900810241699, 0.3088083267211914, 1.095907211303711, 1.8830056190490723, 2.6701040267944336, 3.457202434539795, 4.244300842285156, 5.031399726867676, 5.818498134613037, 6.605596542358398, 7.392695426940918, 8.179794311523438, 8.96689224243164, 9.75399112701416, 10.541089057922363, 11.328187942504883, 12.115285873413086, 12.902384757995605, 13.689483642578125, 14.476581573486328, 15.263680458068848, 16.050779342651367, 16.83787727355957, 17.624977111816406, 18.41207504272461, 19.199172973632812, 19.986270904541016, 20.77337074279785, 21.560468673706055]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 8.0, 11.0, 8.0, 8.0, 10.0, 6.0, 12.0, 14.0, 16.0, 19.0, 22.0, 21.0, 29.0, 24.0, 34.0, 25.0, 30.0, 34.0, 24.0, 34.0, 36.0, 34.0, 35.0, 27.0, 36.0, 41.0, 34.0, 29.0, 30.0, 33.0, 23.0, 27.0, 27.0, 13.0, 26.0, 18.0, 22.0, 14.0, 22.0, 15.0, 13.0, 8.0, 8.0, 6.0, 5.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-47.50079345703125, -46.00641632080078, -44.51204299926758, -43.017669677734375, -41.523292541503906, -40.02891540527344, -38.534542083740234, -37.04016876220703, -35.54579162597656, -34.051414489746094, -32.55704116821289, -31.062665939331055, -29.56829071044922, -28.073915481567383, -26.579540252685547, -25.08516502380371, -23.590789794921875, -22.09641456604004, -20.602039337158203, -19.107664108276367, -17.61328887939453, -16.118913650512695, -14.62453842163086, -13.130163192749023, -11.635787963867188, -10.141412734985352, -8.647037506103516, -7.15266227722168, -5.658287048339844, -4.163911819458008, -2.669536590576172, -1.175161361694336, 0.3192138671875, 1.813589096069336, 3.307964324951172, 4.802339553833008, 6.296714782714844, 7.79109001159668, 9.285465240478516, 10.779840469360352, 12.274215698242188, 13.768590927124023, 15.26296615600586, 16.757341384887695, 18.25171661376953, 19.746091842651367, 21.240467071533203, 22.73484230041504, 24.229217529296875, 25.72359275817871, 27.217967987060547, 28.712343215942383, 30.20671844482422, 31.701093673706055, 33.19546890258789, 34.689842224121094, 36.18421936035156, 37.67859649658203, 39.172969818115234, 40.66734313964844, 42.161720275878906, 43.656097412109375, 45.15047073364258, 46.64484405517578, 48.13922119140625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 6.0, 7.0, 8.0, 12.0, 14.0, 13.0, 21.0, 14.0, 17.0, 27.0, 19.0, 25.0, 23.0, 26.0, 28.0, 46.0, 41.0, 42.0, 45.0, 48.0, 38.0, 50.0, 37.0, 38.0, 30.0, 32.0, 31.0, 28.0, 30.0, 25.0, 26.0, 22.0, 22.0, 16.0, 19.0, 7.0, 16.0, 9.0, 5.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-7.4375, -7.214599609375, -6.99169921875, -6.768798828125, -6.5458984375, -6.322998046875, -6.10009765625, -5.877197265625, -5.654296875, -5.431396484375, -5.20849609375, -4.985595703125, -4.7626953125, -4.539794921875, -4.31689453125, -4.093994140625, -3.87109375, -3.648193359375, -3.42529296875, -3.202392578125, -2.9794921875, -2.756591796875, -2.53369140625, -2.310791015625, -2.087890625, -1.864990234375, -1.64208984375, -1.419189453125, -1.1962890625, -0.973388671875, -0.75048828125, -0.527587890625, -0.3046875, -0.081787109375, 0.14111328125, 0.364013671875, 0.5869140625, 0.809814453125, 1.03271484375, 1.255615234375, 1.478515625, 1.701416015625, 1.92431640625, 2.147216796875, 2.3701171875, 2.593017578125, 2.81591796875, 3.038818359375, 3.26171875, 3.484619140625, 3.70751953125, 3.930419921875, 4.1533203125, 4.376220703125, 4.59912109375, 4.822021484375, 5.044921875, 5.267822265625, 5.49072265625, 5.713623046875, 5.9365234375, 6.159423828125, 6.38232421875, 6.605224609375, 6.828125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 11.0, 6.0, 7.0, 7.0, 12.0, 16.0, 15.0, 23.0, 23.0, 33.0, 60.0, 88.0, 175.0, 381.0, 860.0, 2049.0, 5765.0, 18413.0, 98842.0, 1260143.0, 2498718.0, 261025.0, 33046.0, 8837.0, 3244.0, 1261.0, 538.0, 274.0, 126.0, 66.0, 40.0, 35.0, 24.0, 29.0, 17.0, 17.0, 11.0, 6.0, 8.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.618408203125, -16.04931640625, -15.480224609375, -14.9111328125, -14.342041015625, -13.77294921875, -13.203857421875, -12.634765625, -12.065673828125, -11.49658203125, -10.927490234375, -10.3583984375, -9.789306640625, -9.22021484375, -8.651123046875, -8.08203125, -7.512939453125, -6.94384765625, -6.374755859375, -5.8056640625, -5.236572265625, -4.66748046875, -4.098388671875, -3.529296875, -2.960205078125, -2.39111328125, -1.822021484375, -1.2529296875, -0.683837890625, -0.11474609375, 0.454345703125, 1.0234375, 1.592529296875, 2.16162109375, 2.730712890625, 3.2998046875, 3.868896484375, 4.43798828125, 5.007080078125, 5.576171875, 6.145263671875, 6.71435546875, 7.283447265625, 7.8525390625, 8.421630859375, 8.99072265625, 9.559814453125, 10.12890625, 10.697998046875, 11.26708984375, 11.836181640625, 12.4052734375, 12.974365234375, 13.54345703125, 14.112548828125, 14.681640625, 15.250732421875, 15.81982421875, 16.388916015625, 16.9580078125, 17.527099609375, 18.09619140625, 18.665283203125, 19.234375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 9.0, 7.0, 9.0, 14.0, 26.0, 24.0, 27.0, 28.0, 56.0, 72.0, 80.0, 108.0, 137.0, 217.0, 293.0, 365.0, 440.0, 484.0, 435.0, 323.0, 222.0, 176.0, 132.0, 101.0, 76.0, 65.0, 40.0, 26.0, 19.0, 10.0, 16.0, 11.0, 10.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8671875, -11.48779296875, -11.1083984375, -10.72900390625, -10.349609375, -9.97021484375, -9.5908203125, -9.21142578125, -8.83203125, -8.45263671875, -8.0732421875, -7.69384765625, -7.314453125, -6.93505859375, -6.5556640625, -6.17626953125, -5.796875, -5.41748046875, -5.0380859375, -4.65869140625, -4.279296875, -3.89990234375, -3.5205078125, -3.14111328125, -2.76171875, -2.38232421875, -2.0029296875, -1.62353515625, -1.244140625, -0.86474609375, -0.4853515625, -0.10595703125, 0.2734375, 0.65283203125, 1.0322265625, 1.41162109375, 1.791015625, 2.17041015625, 2.5498046875, 2.92919921875, 3.30859375, 3.68798828125, 4.0673828125, 4.44677734375, 4.826171875, 5.20556640625, 5.5849609375, 5.96435546875, 6.34375, 6.72314453125, 7.1025390625, 7.48193359375, 7.861328125, 8.24072265625, 8.6201171875, 8.99951171875, 9.37890625, 9.75830078125, 10.1376953125, 10.51708984375, 10.896484375, 11.27587890625, 11.6552734375, 12.03466796875, 12.4140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 5.0, 6.0, 10.0, 14.0, 20.0, 29.0, 33.0, 56.0, 57.0, 81.0, 87.0, 142.0, 219.0, 375.0, 776.0, 2893.0, 23831.0, 688139.0, 3395488.0, 73070.0, 6282.0, 1250.0, 477.0, 249.0, 173.0, 127.0, 89.0, 79.0, 49.0, 42.0, 25.0, 27.0, 19.0, 14.0, 12.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-48.5, -47.23046875, -45.9609375, -44.69140625, -43.421875, -42.15234375, -40.8828125, -39.61328125, -38.34375, -37.07421875, -35.8046875, -34.53515625, -33.265625, -31.99609375, -30.7265625, -29.45703125, -28.1875, -26.91796875, -25.6484375, -24.37890625, -23.109375, -21.83984375, -20.5703125, -19.30078125, -18.03125, -16.76171875, -15.4921875, -14.22265625, -12.953125, -11.68359375, -10.4140625, -9.14453125, -7.875, -6.60546875, -5.3359375, -4.06640625, -2.796875, -1.52734375, -0.2578125, 1.01171875, 2.28125, 3.55078125, 4.8203125, 6.08984375, 7.359375, 8.62890625, 9.8984375, 11.16796875, 12.4375, 13.70703125, 14.9765625, 16.24609375, 17.515625, 18.78515625, 20.0546875, 21.32421875, 22.59375, 23.86328125, 25.1328125, 26.40234375, 27.671875, 28.94140625, 30.2109375, 31.48046875, 32.75]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 15.0, 29.0, 37.0, 75.0, 138.0, 190.0, 196.0, 134.0, 80.0, 59.0, 26.0, 8.0, 9.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.93444061279297, -103.53251647949219, -101.13058471679688, -98.7286605834961, -96.32673645019531, -93.9248046875, -91.52288055419922, -89.12095642089844, -86.71902465820312, -84.31710052490234, -81.91516876220703, -79.51324462890625, -77.11131286621094, -74.70938873291016, -72.30746459960938, -69.90553283691406, -67.50360870361328, -65.1016845703125, -62.69975280761719, -60.297828674316406, -57.89590072631836, -55.49397277832031, -53.09204864501953, -50.690120697021484, -48.28819274902344, -45.88626480102539, -43.484336853027344, -41.08241271972656, -38.680484771728516, -36.27855682373047, -33.87663269042969, -31.47470474243164, -29.072784423828125, -26.670856475830078, -24.268930435180664, -21.86700439453125, -19.465076446533203, -17.063148498535156, -14.661222457885742, -12.259296417236328, -9.857368469238281, -7.455441474914551, -5.05351448059082, -2.65158748626709, -0.24966049194335938, 2.152266502380371, 4.554193496704102, 6.956119537353516, 9.358047485351562, 11.759974479675293, 14.161901473999023, 16.563827514648438, 18.965755462646484, 21.36768341064453, 23.769609451293945, 26.17153549194336, 28.573463439941406, 30.975391387939453, 33.3773193359375, 35.77924346923828, 38.18117141723633, 40.583099365234375, 42.985023498535156, 45.3869514465332, 47.78887939453125]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 6.0, 20.0, 17.0, 18.0, 24.0, 16.0, 31.0, 33.0, 31.0, 32.0, 32.0, 41.0, 40.0, 42.0, 38.0, 46.0, 35.0, 40.0, 56.0, 52.0, 35.0, 42.0, 32.0, 33.0, 25.0, 16.0, 19.0, 23.0, 21.0, 13.0, 13.0, 6.0, 9.0, 7.0, 5.0, 3.0, 10.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.097259521484375, -44.75735092163086, -43.41743850708008, -42.07752990722656, -40.73761749267578, -39.397708892822266, -38.05780029296875, -36.71788787841797, -35.37797546386719, -34.03806686401367, -32.69815444946289, -31.358245849609375, -30.018333435058594, -28.678424835205078, -27.33851432800293, -25.99860382080078, -24.658695220947266, -23.318784713745117, -21.97887420654297, -20.638965606689453, -19.299053192138672, -17.959144592285156, -16.619234085083008, -15.27932357788086, -13.939413070678711, -12.599502563476562, -11.259592056274414, -9.919682502746582, -8.579771995544434, -7.239861488342285, -5.899951934814453, -4.560041427612305, -3.2201309204101562, -1.880220651626587, -0.5403103828430176, 0.7995996475219727, 2.139510154724121, 3.4794206619262695, 4.819330215454102, 6.15924072265625, 7.499151229858398, 8.839061737060547, 10.178972244262695, 11.518881797790527, 12.858792304992676, 14.198702812194824, 15.538612365722656, 16.878522872924805, 18.218433380126953, 19.5583438873291, 20.89825439453125, 22.238162994384766, 23.578075408935547, 24.917984008789062, 26.25789451599121, 27.59780502319336, 28.937715530395508, 30.277626037597656, 31.617536544799805, 32.95744705200195, 34.29735565185547, 35.63726806640625, 36.977176666259766, 38.31708526611328, 39.65699768066406]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 8.0, 15.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 33.0, 35.0, 38.0, 40.0, 39.0, 41.0, 32.0, 38.0, 34.0, 42.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 11.0, 4.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.35546875, -7.12518310546875, -6.8948974609375, -6.66461181640625, -6.434326171875, -6.20404052734375, -5.9737548828125, -5.74346923828125, -5.51318359375, -5.28289794921875, -5.0526123046875, -4.82232666015625, -4.592041015625, -4.36175537109375, -4.1314697265625, -3.90118408203125, -3.6708984375, -3.44061279296875, -3.2103271484375, -2.98004150390625, -2.749755859375, -2.51947021484375, -2.2891845703125, -2.05889892578125, -1.82861328125, -1.59832763671875, -1.3680419921875, -1.13775634765625, -0.907470703125, -0.67718505859375, -0.4468994140625, -0.21661376953125, 0.013671875, 0.24395751953125, 0.4742431640625, 0.70452880859375, 0.934814453125, 1.16510009765625, 1.3953857421875, 1.62567138671875, 1.85595703125, 2.08624267578125, 2.3165283203125, 2.54681396484375, 2.777099609375, 3.00738525390625, 3.2376708984375, 3.46795654296875, 3.6982421875, 3.92852783203125, 4.1588134765625, 4.38909912109375, 4.619384765625, 4.84967041015625, 5.0799560546875, 5.31024169921875, 5.54052734375, 5.77081298828125, 6.0010986328125, 6.23138427734375, 6.461669921875, 6.69195556640625, 6.9222412109375, 7.15252685546875, 7.3828125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 13.0, 24.0, 27.0, 43.0, 71.0, 96.0, 125.0, 216.0, 306.0, 429.0, 621.0, 903.0, 1327.0, 1927.0, 2816.0, 4178.0, 5926.0, 8857.0, 12667.0, 19026.0, 27304.0, 40205.0, 58832.0, 85279.0, 118523.0, 148898.0, 144507.0, 112765.0, 80016.0, 54784.0, 37284.0, 25655.0, 17344.0, 11671.0, 8192.0, 5649.0, 3821.0, 2566.0, 1770.0, 1236.0, 793.0, 600.0, 385.0, 273.0, 178.0, 136.0, 86.0, 68.0, 43.0, 35.0, 21.0, 14.0, 6.0, 5.0, 5.0, 4.0, 2.0], "bins": [-0.63134765625, -0.6121597290039062, -0.5929718017578125, -0.5737838745117188, -0.554595947265625, -0.5354080200195312, -0.5162200927734375, -0.49703216552734375, -0.47784423828125, -0.45865631103515625, -0.4394683837890625, -0.42028045654296875, -0.401092529296875, -0.38190460205078125, -0.3627166748046875, -0.34352874755859375, -0.3243408203125, -0.30515289306640625, -0.2859649658203125, -0.26677703857421875, -0.247589111328125, -0.22840118408203125, -0.2092132568359375, -0.19002532958984375, -0.17083740234375, -0.15164947509765625, -0.1324615478515625, -0.11327362060546875, -0.094085693359375, -0.07489776611328125, -0.0557098388671875, -0.03652191162109375, -0.017333984375, 0.00185394287109375, 0.0210418701171875, 0.04022979736328125, 0.059417724609375, 0.07860565185546875, 0.0977935791015625, 0.11698150634765625, 0.13616943359375, 0.15535736083984375, 0.1745452880859375, 0.19373321533203125, 0.212921142578125, 0.23210906982421875, 0.2512969970703125, 0.27048492431640625, 0.2896728515625, 0.30886077880859375, 0.3280487060546875, 0.34723663330078125, 0.366424560546875, 0.38561248779296875, 0.4048004150390625, 0.42398834228515625, 0.44317626953125, 0.46236419677734375, 0.4815521240234375, 0.5007400512695312, 0.519927978515625, 0.5391159057617188, 0.5583038330078125, 0.5774917602539062, 0.5966796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 7.0, 7.0, 10.0, 16.0, 18.0, 22.0, 15.0, 25.0, 29.0, 23.0, 20.0, 29.0, 28.0, 46.0, 38.0, 45.0, 36.0, 33.0, 32.0, 1055.0, 39.0, 46.0, 46.0, 30.0, 25.0, 43.0, 26.0, 22.0, 25.0, 27.0, 21.0, 28.0, 17.0, 13.0, 15.0, 13.0, 11.0, 4.0, 10.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.68878173828125, -4.5416259765625, -4.39447021484375, -4.247314453125, -4.10015869140625, -3.9530029296875, -3.80584716796875, -3.65869140625, -3.51153564453125, -3.3643798828125, -3.21722412109375, -3.070068359375, -2.92291259765625, -2.7757568359375, -2.62860107421875, -2.4814453125, -2.33428955078125, -2.1871337890625, -2.03997802734375, -1.892822265625, -1.74566650390625, -1.5985107421875, -1.45135498046875, -1.30419921875, -1.15704345703125, -1.0098876953125, -0.86273193359375, -0.715576171875, -0.56842041015625, -0.4212646484375, -0.27410888671875, -0.126953125, 0.02020263671875, 0.1673583984375, 0.31451416015625, 0.461669921875, 0.60882568359375, 0.7559814453125, 0.90313720703125, 1.05029296875, 1.19744873046875, 1.3446044921875, 1.49176025390625, 1.638916015625, 1.78607177734375, 1.9332275390625, 2.08038330078125, 2.2275390625, 2.37469482421875, 2.5218505859375, 2.66900634765625, 2.816162109375, 2.96331787109375, 3.1104736328125, 3.25762939453125, 3.40478515625, 3.55194091796875, 3.6990966796875, 3.84625244140625, 3.993408203125, 4.14056396484375, 4.2877197265625, 4.43487548828125, 4.58203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 12.0, 10.0, 11.0, 29.0, 43.0, 41.0, 72.0, 120.0, 193.0, 285.0, 465.0, 714.0, 1186.0, 1803.0, 2966.0, 4363.0, 6714.0, 10379.0, 16068.0, 25077.0, 38331.0, 58337.0, 86205.0, 119207.0, 317434.0, 1025026.0, 121630.0, 87719.0, 60397.0, 39616.0, 25724.0, 16723.0, 10650.0, 6950.0, 4502.0, 2854.0, 1886.0, 1204.0, 764.0, 510.0, 336.0, 212.0, 146.0, 79.0, 44.0, 34.0, 23.0, 11.0, 13.0, 6.0, 7.0, 5.0, 1.0, 2.0], "bins": [-0.59814453125, -0.5810699462890625, -0.563995361328125, -0.5469207763671875, -0.52984619140625, -0.5127716064453125, -0.495697021484375, -0.4786224365234375, -0.4615478515625, -0.4444732666015625, -0.427398681640625, -0.4103240966796875, -0.39324951171875, -0.3761749267578125, -0.359100341796875, -0.3420257568359375, -0.324951171875, -0.3078765869140625, -0.290802001953125, -0.2737274169921875, -0.25665283203125, -0.2395782470703125, -0.222503662109375, -0.2054290771484375, -0.1883544921875, -0.1712799072265625, -0.154205322265625, -0.1371307373046875, -0.12005615234375, -0.1029815673828125, -0.085906982421875, -0.0688323974609375, -0.0517578125, -0.0346832275390625, -0.017608642578125, -0.0005340576171875, 0.01654052734375, 0.0336151123046875, 0.050689697265625, 0.0677642822265625, 0.0848388671875, 0.1019134521484375, 0.118988037109375, 0.1360626220703125, 0.15313720703125, 0.1702117919921875, 0.187286376953125, 0.2043609619140625, 0.221435546875, 0.2385101318359375, 0.255584716796875, 0.2726593017578125, 0.28973388671875, 0.3068084716796875, 0.323883056640625, 0.3409576416015625, 0.3580322265625, 0.3751068115234375, 0.392181396484375, 0.4092559814453125, 0.42633056640625, 0.4434051513671875, 0.460479736328125, 0.4775543212890625, 0.49462890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 2.0, 10.0, 7.0, 14.0, 13.0, 29.0, 39.0, 39.0, 44.0, 59.0, 80.0, 101.0, 83.0, 86.0, 85.0, 80.0, 50.0, 41.0, 25.0, 28.0, 17.0, 10.0, 9.0, 6.0, 8.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.005615234375, -0.00545269250869751, -0.0052901506423950195, -0.005127608776092529, -0.004965066909790039, -0.004802525043487549, -0.004639983177185059, -0.004477441310882568, -0.004314899444580078, -0.004152357578277588, -0.003989815711975098, -0.0038272738456726074, -0.003664731979370117, -0.003502190113067627, -0.0033396482467651367, -0.0031771063804626465, -0.0030145645141601562, -0.002852022647857666, -0.0026894807815551758, -0.0025269389152526855, -0.0023643970489501953, -0.002201855182647705, -0.002039313316345215, -0.0018767714500427246, -0.0017142295837402344, -0.0015516877174377441, -0.001389145851135254, -0.0012266039848327637, -0.0010640621185302734, -0.0009015202522277832, -0.000738978385925293, -0.0005764365196228027, -0.0004138946533203125, -0.00025135278701782227, -8.881092071533203e-05, 7.37309455871582e-05, 0.00023627281188964844, 0.00039881467819213867, 0.0005613565444946289, 0.0007238984107971191, 0.0008864402770996094, 0.0010489821434020996, 0.0012115240097045898, 0.00137406587600708, 0.0015366077423095703, 0.0016991496086120605, 0.0018616914749145508, 0.002024233341217041, 0.0021867752075195312, 0.0023493170738220215, 0.0025118589401245117, 0.002674400806427002, 0.002836942672729492, 0.0029994845390319824, 0.0031620264053344727, 0.003324568271636963, 0.003487110137939453, 0.0036496520042419434, 0.0038121938705444336, 0.003974735736846924, 0.004137277603149414, 0.004299819469451904, 0.0044623613357543945, 0.004624903202056885, 0.004787445068359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 9.0, 8.0, 8.0, 10.0, 15.0, 28.0, 33.0, 50.0, 73.0, 112.0, 167.0, 338.0, 872.0, 164677.0, 879786.0, 1361.0, 372.0, 207.0, 122.0, 86.0, 59.0, 37.0, 22.0, 29.0, 9.0, 17.0, 7.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09300422668457031, -0.08957290649414062, -0.08614158630371094, -0.08271026611328125, -0.07927894592285156, -0.07584762573242188, -0.07241630554199219, -0.0689849853515625, -0.06555366516113281, -0.062122344970703125, -0.05869102478027344, -0.05525970458984375, -0.05182838439941406, -0.048397064208984375, -0.04496574401855469, -0.041534423828125, -0.03810310363769531, -0.034671783447265625, -0.031240463256835938, -0.02780914306640625, -0.024377822875976562, -0.020946502685546875, -0.017515182495117188, -0.0140838623046875, -0.010652542114257812, -0.007221221923828125, -0.0037899017333984375, -0.00035858154296875, 0.0030727386474609375, 0.006504058837890625, 0.009935379028320312, 0.01336669921875, 0.016798019409179688, 0.020229339599609375, 0.023660659790039062, 0.02709197998046875, 0.030523300170898438, 0.033954620361328125, 0.03738594055175781, 0.0408172607421875, 0.04424858093261719, 0.047679901123046875, 0.05111122131347656, 0.05454254150390625, 0.05797386169433594, 0.061405181884765625, 0.06483650207519531, 0.068267822265625, 0.07169914245605469, 0.07513046264648438, 0.07856178283691406, 0.08199310302734375, 0.08542442321777344, 0.08885574340820312, 0.09228706359863281, 0.0957183837890625, 0.09914970397949219, 0.10258102416992188, 0.10601234436035156, 0.10944366455078125, 0.11287498474121094, 0.11630630493164062, 0.11973762512207031, 0.1231689453125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 9.0, 129.0, 702.0, 170.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012886013835668564, -0.012287216261029243, -0.011688417755067348, -0.011089619249105453, -0.010490821674466133, -0.009892024099826813, -0.009293225593864918, -0.008694427087903023, -0.008095629513263702, -0.007496831472963095, -0.006898033432662487, -0.006299235392361879, -0.005700437352061272, -0.005101639311760664, -0.004502841271460056, -0.0039040432311594486, -0.003305245190858841, -0.0027064471505582333, -0.0021076491102576256, -0.001508851069957018, -0.0009100530296564102, -0.00031125498935580254, 0.00028754305094480515, 0.0008863410912454128, 0.0014851391315460205, 0.002083937171846628, 0.002682735212147236, 0.0032815332524478436, 0.0038803312927484512, 0.004479129333049059, 0.005077927373349667, 0.005676725413650274, 0.006275523453950882, 0.00687432149425149, 0.007473119534552097, 0.008071918040513992, 0.008670715615153313, 0.009269513189792633, 0.009868311695754528, 0.010467110201716423, 0.011065907776355743, 0.011664705350995064, 0.012263503856956959, 0.012862302362918854, 0.013461099937558174, 0.014059897512197495, 0.01465869601815939, 0.015257494524121284, 0.015856292098760605, 0.016455089673399925, 0.017053887248039246, 0.017652686685323715, 0.018251484259963036, 0.018850281834602356, 0.019449081271886826, 0.020047878846526146, 0.020646676421165466, 0.021245473995804787, 0.021844271570444107, 0.022443071007728577, 0.023041868582367897, 0.023640666157007217, 0.024239465594291687, 0.024838263168931007, 0.025437060743570328]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 7.0, 6.0, 8.0, 12.0, 16.0, 22.0, 15.0, 15.0, 19.0, 23.0, 29.0, 28.0, 24.0, 28.0, 34.0, 34.0, 36.0, 33.0, 32.0, 42.0, 36.0, 34.0, 39.0, 47.0, 30.0, 33.0, 32.0, 40.0, 38.0, 30.0, 27.0, 24.0, 18.0, 20.0, 22.0, 16.0, 4.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002066671848297119, -0.002003171481192112, -0.0019396711140871048, -0.0018761707469820976, -0.0018126703798770905, -0.0017491700127720833, -0.0016856696456670761, -0.001622169278562069, -0.0015586689114570618, -0.0014951685443520546, -0.0014316681772470474, -0.0013681678101420403, -0.001304667443037033, -0.001241167075932026, -0.0011776667088270187, -0.0011141663417220116, -0.0010506659746170044, -0.0009871656075119972, -0.00092366524040699, -0.0008601648733019829, -0.0007966645061969757, -0.0007331641390919685, -0.0006696637719869614, -0.0006061634048819542, -0.000542663037776947, -0.00047916267067193985, -0.0004156623035669327, -0.0003521619364619255, -0.00028866156935691833, -0.00022516120225191116, -0.000161660835146904, -9.816046804189682e-05, -3.466010093688965e-05, 2.8840266168117523e-05, 9.23406332731247e-05, 0.00015584100037813187, 0.00021934136748313904, 0.0002828417345881462, 0.0003463421016931534, 0.00040984246879816055, 0.0004733428359031677, 0.0005368432030081749, 0.0006003435701131821, 0.0006638439372181892, 0.0007273443043231964, 0.0007908446714282036, 0.0008543450385332108, 0.0009178454056382179, 0.000981345772743225, 0.0010448461398482323, 0.0011083465069532394, 0.0011718468740582466, 0.0012353472411632538, 0.001298847608268261, 0.0013623479753732681, 0.0014258483424782753, 0.0014893487095832825, 0.0015528490766882896, 0.0016163494437932968, 0.001679849810898304, 0.0017433501780033112, 0.0018068505451083183, 0.0018703509122133255, 0.0019338512793183327, 0.00199735164642334]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 2.0, 7.0, 3.0, 7.0, 16.0, 15.0, 15.0, 14.0, 17.0, 13.0, 19.0, 22.0, 26.0, 24.0, 24.0, 38.0, 32.0, 36.0, 37.0, 40.0, 40.0, 41.0, 32.0, 38.0, 33.0, 43.0, 44.0, 37.0, 35.0, 32.0, 34.0, 28.0, 14.0, 17.0, 27.0, 20.0, 15.0, 12.0, 10.0, 5.0, 11.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.359375, -7.1290283203125, -6.898681640625, -6.6683349609375, -6.43798828125, -6.2076416015625, -5.977294921875, -5.7469482421875, -5.5166015625, -5.2862548828125, -5.055908203125, -4.8255615234375, -4.59521484375, -4.3648681640625, -4.134521484375, -3.9041748046875, -3.673828125, -3.4434814453125, -3.213134765625, -2.9827880859375, -2.75244140625, -2.5220947265625, -2.291748046875, -2.0614013671875, -1.8310546875, -1.6007080078125, -1.370361328125, -1.1400146484375, -0.90966796875, -0.6793212890625, -0.448974609375, -0.2186279296875, 0.01171875, 0.2420654296875, 0.472412109375, 0.7027587890625, 0.93310546875, 1.1634521484375, 1.393798828125, 1.6241455078125, 1.8544921875, 2.0848388671875, 2.315185546875, 2.5455322265625, 2.77587890625, 3.0062255859375, 3.236572265625, 3.4669189453125, 3.697265625, 3.9276123046875, 4.157958984375, 4.3883056640625, 4.61865234375, 4.8489990234375, 5.079345703125, 5.3096923828125, 5.5400390625, 5.7703857421875, 6.000732421875, 6.2310791015625, 6.46142578125, 6.6917724609375, 6.922119140625, 7.1524658203125, 7.3828125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 10.0, 7.0, 8.0, 14.0, 8.0, 13.0, 26.0, 31.0, 40.0, 39.0, 65.0, 58.0, 81.0, 110.0, 172.0, 216.0, 288.0, 411.0, 547.0, 1196.0, 2805.0, 9197.0, 36095.0, 505895.0, 441567.0, 34762.0, 8871.0, 2699.0, 1095.0, 584.0, 402.0, 293.0, 254.0, 156.0, 126.0, 101.0, 84.0, 58.0, 36.0, 34.0, 23.0, 18.0, 14.0, 14.0, 6.0, 10.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.515625, -17.936767578125, -17.35791015625, -16.779052734375, -16.2001953125, -15.621337890625, -15.04248046875, -14.463623046875, -13.884765625, -13.305908203125, -12.72705078125, -12.148193359375, -11.5693359375, -10.990478515625, -10.41162109375, -9.832763671875, -9.25390625, -8.675048828125, -8.09619140625, -7.517333984375, -6.9384765625, -6.359619140625, -5.78076171875, -5.201904296875, -4.623046875, -4.044189453125, -3.46533203125, -2.886474609375, -2.3076171875, -1.728759765625, -1.14990234375, -0.571044921875, 0.0078125, 0.586669921875, 1.16552734375, 1.744384765625, 2.3232421875, 2.902099609375, 3.48095703125, 4.059814453125, 4.638671875, 5.217529296875, 5.79638671875, 6.375244140625, 6.9541015625, 7.532958984375, 8.11181640625, 8.690673828125, 9.26953125, 9.848388671875, 10.42724609375, 11.006103515625, 11.5849609375, 12.163818359375, 12.74267578125, 13.321533203125, 13.900390625, 14.479248046875, 15.05810546875, 15.636962890625, 16.2158203125, 16.794677734375, 17.37353515625, 17.952392578125, 18.53125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 10.0, 13.0, 10.0, 21.0, 19.0, 16.0, 25.0, 29.0, 22.0, 33.0, 37.0, 38.0, 42.0, 47.0, 62.0, 99.0, 1701.0, 273.0, 78.0, 63.0, 41.0, 49.0, 38.0, 29.0, 29.0, 35.0, 23.0, 19.0, 23.0, 15.0, 18.0, 5.0, 8.0, 8.0, 8.0, 4.0, 7.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-20.390625, -19.768798828125, -19.14697265625, -18.525146484375, -17.9033203125, -17.281494140625, -16.65966796875, -16.037841796875, -15.416015625, -14.794189453125, -14.17236328125, -13.550537109375, -12.9287109375, -12.306884765625, -11.68505859375, -11.063232421875, -10.44140625, -9.819580078125, -9.19775390625, -8.575927734375, -7.9541015625, -7.332275390625, -6.71044921875, -6.088623046875, -5.466796875, -4.844970703125, -4.22314453125, -3.601318359375, -2.9794921875, -2.357666015625, -1.73583984375, -1.114013671875, -0.4921875, 0.129638671875, 0.75146484375, 1.373291015625, 1.9951171875, 2.616943359375, 3.23876953125, 3.860595703125, 4.482421875, 5.104248046875, 5.72607421875, 6.347900390625, 6.9697265625, 7.591552734375, 8.21337890625, 8.835205078125, 9.45703125, 10.078857421875, 10.70068359375, 11.322509765625, 11.9443359375, 12.566162109375, 13.18798828125, 13.809814453125, 14.431640625, 15.053466796875, 15.67529296875, 16.297119140625, 16.9189453125, 17.540771484375, 18.16259765625, 18.784423828125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 11.0, 10.0, 6.0, 13.0, 19.0, 23.0, 28.0, 22.0, 25.0, 35.0, 51.0, 67.0, 78.0, 128.0, 225.0, 515.0, 3182.0, 113264.0, 3013563.0, 12496.0, 967.0, 317.0, 174.0, 82.0, 65.0, 52.0, 38.0, 33.0, 37.0, 26.0, 22.0, 20.0, 16.0, 19.0, 10.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.96875, -52.24072265625, -50.5126953125, -48.78466796875, -47.056640625, -45.32861328125, -43.6005859375, -41.87255859375, -40.14453125, -38.41650390625, -36.6884765625, -34.96044921875, -33.232421875, -31.50439453125, -29.7763671875, -28.04833984375, -26.3203125, -24.59228515625, -22.8642578125, -21.13623046875, -19.408203125, -17.68017578125, -15.9521484375, -14.22412109375, -12.49609375, -10.76806640625, -9.0400390625, -7.31201171875, -5.583984375, -3.85595703125, -2.1279296875, -0.39990234375, 1.328125, 3.05615234375, 4.7841796875, 6.51220703125, 8.240234375, 9.96826171875, 11.6962890625, 13.42431640625, 15.15234375, 16.88037109375, 18.6083984375, 20.33642578125, 22.064453125, 23.79248046875, 25.5205078125, 27.24853515625, 28.9765625, 30.70458984375, 32.4326171875, 34.16064453125, 35.888671875, 37.61669921875, 39.3447265625, 41.07275390625, 42.80078125, 44.52880859375, 46.2568359375, 47.98486328125, 49.712890625, 51.44091796875, 53.1689453125, 54.89697265625, 56.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 66.0, 207.0, 353.0, 258.0, 88.0, 19.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.25318908691406, -75.3061752319336, -73.35916900634766, -71.41215515136719, -69.46514892578125, -67.51813507080078, -65.57112884521484, -63.624114990234375, -61.67710876464844, -59.730098724365234, -57.78308868408203, -55.83607864379883, -53.889068603515625, -51.94205856323242, -49.99504852294922, -48.04803466796875, -46.10102462768555, -44.154014587402344, -42.20700454711914, -40.25999450683594, -38.312984466552734, -36.36597442626953, -34.41896057128906, -32.471954345703125, -30.52494239807129, -28.577932357788086, -26.630922317504883, -24.683910369873047, -22.736900329589844, -20.78989028930664, -18.842880249023438, -16.895870208740234, -14.948856353759766, -13.001846313476562, -11.05483627319336, -9.10782527923584, -7.160815238952637, -5.213805198669434, -3.266794204711914, -1.319784164428711, 0.6272258758544922, 2.5742361545562744, 4.521246433258057, 6.468256950378418, 8.415266990661621, 10.362277030944824, 12.309288024902344, 14.256298065185547, 16.20330810546875, 18.150318145751953, 20.097328186035156, 22.04433822631836, 23.991348266601562, 25.938358306884766, 27.8853702545166, 29.832380294799805, 31.779390335083008, 33.726402282714844, 35.67341232299805, 37.62042236328125, 39.56743240356445, 41.514442443847656, 43.46145248413086, 45.40846252441406, 47.355472564697266]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 1.0, 8.0, 7.0, 6.0, 20.0, 14.0, 17.0, 21.0, 26.0, 26.0, 31.0, 41.0, 35.0, 47.0, 37.0, 61.0, 42.0, 47.0, 51.0, 42.0, 32.0, 40.0, 44.0, 44.0, 34.0, 37.0, 37.0, 23.0, 17.0, 15.0, 19.0, 10.0, 19.0, 12.0, 4.0, 5.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.02687072753906, -59.1953239440918, -57.3637809753418, -55.53223419189453, -53.700687408447266, -51.869140625, -50.03759765625, -48.206050872802734, -46.37450408935547, -44.5429573059082, -42.7114143371582, -40.87986755371094, -39.04832077026367, -37.216773986816406, -35.385231018066406, -33.55368423461914, -31.72214126586914, -29.890596389770508, -28.059049606323242, -26.22750473022461, -24.395957946777344, -22.56441307067871, -20.732868194580078, -18.901321411132812, -17.06977653503418, -15.23823070526123, -13.406684875488281, -11.575139999389648, -9.7435941696167, -7.91204833984375, -6.080503463745117, -4.248957633972168, -2.4174118041992188, -0.5858662128448486, 1.2456793785095215, 3.0772247314453125, 4.908770561218262, 6.740316390991211, 8.571861267089844, 10.403407096862793, 12.234952926635742, 14.066498756408691, 15.89804458618164, 17.729589462280273, 19.561134338378906, 21.392681121826172, 23.224225997924805, 25.055770874023438, 26.887317657470703, 28.718862533569336, 30.5504093170166, 32.381954193115234, 34.2135009765625, 36.0450439453125, 37.876590728759766, 39.70813751220703, 41.53968048095703, 43.3712272644043, 45.2027702331543, 47.03431701660156, 48.86586380004883, 50.697410583496094, 52.528953552246094, 54.36050033569336, 56.192047119140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 2.0, 8.0, 11.0, 9.0, 12.0, 16.0, 18.0, 16.0, 23.0, 19.0, 22.0, 28.0, 26.0, 20.0, 29.0, 41.0, 34.0, 43.0, 46.0, 39.0, 42.0, 44.0, 34.0, 46.0, 41.0, 38.0, 35.0, 43.0, 34.0, 10.0, 26.0, 24.0, 23.0, 20.0, 17.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 1.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-7.828125, -7.58636474609375, -7.3446044921875, -7.10284423828125, -6.861083984375, -6.61932373046875, -6.3775634765625, -6.13580322265625, -5.89404296875, -5.65228271484375, -5.4105224609375, -5.16876220703125, -4.927001953125, -4.68524169921875, -4.4434814453125, -4.20172119140625, -3.9599609375, -3.71820068359375, -3.4764404296875, -3.23468017578125, -2.992919921875, -2.75115966796875, -2.5093994140625, -2.26763916015625, -2.02587890625, -1.78411865234375, -1.5423583984375, -1.30059814453125, -1.058837890625, -0.81707763671875, -0.5753173828125, -0.33355712890625, -0.091796875, 0.14996337890625, 0.3917236328125, 0.63348388671875, 0.875244140625, 1.11700439453125, 1.3587646484375, 1.60052490234375, 1.84228515625, 2.08404541015625, 2.3258056640625, 2.56756591796875, 2.809326171875, 3.05108642578125, 3.2928466796875, 3.53460693359375, 3.7763671875, 4.01812744140625, 4.2598876953125, 4.50164794921875, 4.743408203125, 4.98516845703125, 5.2269287109375, 5.46868896484375, 5.71044921875, 5.95220947265625, 6.1939697265625, 6.43572998046875, 6.677490234375, 6.91925048828125, 7.1610107421875, 7.40277099609375, 7.64453125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 17.0, 8.0, 16.0, 24.0, 29.0, 44.0, 58.0, 94.0, 104.0, 160.0, 283.0, 433.0, 759.0, 1369.0, 2700.0, 6098.0, 14870.0, 49043.0, 328152.0, 2165501.0, 1399109.0, 172450.0, 32382.0, 10983.0, 4507.0, 2242.0, 1089.0, 643.0, 375.0, 205.0, 145.0, 78.0, 74.0, 52.0, 35.0, 25.0, 22.0, 19.0, 20.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-15.796875, -15.31591796875, -14.8349609375, -14.35400390625, -13.873046875, -13.39208984375, -12.9111328125, -12.43017578125, -11.94921875, -11.46826171875, -10.9873046875, -10.50634765625, -10.025390625, -9.54443359375, -9.0634765625, -8.58251953125, -8.1015625, -7.62060546875, -7.1396484375, -6.65869140625, -6.177734375, -5.69677734375, -5.2158203125, -4.73486328125, -4.25390625, -3.77294921875, -3.2919921875, -2.81103515625, -2.330078125, -1.84912109375, -1.3681640625, -0.88720703125, -0.40625, 0.07470703125, 0.5556640625, 1.03662109375, 1.517578125, 1.99853515625, 2.4794921875, 2.96044921875, 3.44140625, 3.92236328125, 4.4033203125, 4.88427734375, 5.365234375, 5.84619140625, 6.3271484375, 6.80810546875, 7.2890625, 7.77001953125, 8.2509765625, 8.73193359375, 9.212890625, 9.69384765625, 10.1748046875, 10.65576171875, 11.13671875, 11.61767578125, 12.0986328125, 12.57958984375, 13.060546875, 13.54150390625, 14.0224609375, 14.50341796875, 14.984375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 5.0, 5.0, 13.0, 15.0, 29.0, 34.0, 38.0, 81.0, 100.0, 181.0, 244.0, 377.0, 565.0, 653.0, 601.0, 391.0, 229.0, 157.0, 116.0, 91.0, 50.0, 32.0, 21.0, 20.0, 10.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.671875, -15.139892578125, -14.60791015625, -14.075927734375, -13.5439453125, -13.011962890625, -12.47998046875, -11.947998046875, -11.416015625, -10.884033203125, -10.35205078125, -9.820068359375, -9.2880859375, -8.756103515625, -8.22412109375, -7.692138671875, -7.16015625, -6.628173828125, -6.09619140625, -5.564208984375, -5.0322265625, -4.500244140625, -3.96826171875, -3.436279296875, -2.904296875, -2.372314453125, -1.84033203125, -1.308349609375, -0.7763671875, -0.244384765625, 0.28759765625, 0.819580078125, 1.3515625, 1.883544921875, 2.41552734375, 2.947509765625, 3.4794921875, 4.011474609375, 4.54345703125, 5.075439453125, 5.607421875, 6.139404296875, 6.67138671875, 7.203369140625, 7.7353515625, 8.267333984375, 8.79931640625, 9.331298828125, 9.86328125, 10.395263671875, 10.92724609375, 11.459228515625, 11.9912109375, 12.523193359375, 13.05517578125, 13.587158203125, 14.119140625, 14.651123046875, 15.18310546875, 15.715087890625, 16.2470703125, 16.779052734375, 17.31103515625, 17.843017578125, 18.375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 8.0, 8.0, 14.0, 22.0, 35.0, 59.0, 54.0, 74.0, 135.0, 177.0, 264.0, 528.0, 1547.0, 8580.0, 121150.0, 3734941.0, 307272.0, 15544.0, 2288.0, 683.0, 327.0, 177.0, 130.0, 75.0, 53.0, 32.0, 30.0, 26.0, 15.0, 7.0, 10.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.84375, -44.48046875, -43.1171875, -41.75390625, -40.390625, -39.02734375, -37.6640625, -36.30078125, -34.9375, -33.57421875, -32.2109375, -30.84765625, -29.484375, -28.12109375, -26.7578125, -25.39453125, -24.03125, -22.66796875, -21.3046875, -19.94140625, -18.578125, -17.21484375, -15.8515625, -14.48828125, -13.125, -11.76171875, -10.3984375, -9.03515625, -7.671875, -6.30859375, -4.9453125, -3.58203125, -2.21875, -0.85546875, 0.5078125, 1.87109375, 3.234375, 4.59765625, 5.9609375, 7.32421875, 8.6875, 10.05078125, 11.4140625, 12.77734375, 14.140625, 15.50390625, 16.8671875, 18.23046875, 19.59375, 20.95703125, 22.3203125, 23.68359375, 25.046875, 26.41015625, 27.7734375, 29.13671875, 30.5, 31.86328125, 33.2265625, 34.58984375, 35.953125, 37.31640625, 38.6796875, 40.04296875, 41.40625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 15.0, 67.0, 247.0, 389.0, 209.0, 66.0, 14.0, 1.0, 0.0, 0.0, 1.0], "bins": [-306.80279541015625, -301.35601806640625, -295.90924072265625, -290.46246337890625, -285.01568603515625, -279.56890869140625, -274.12213134765625, -268.67535400390625, -263.22857666015625, -257.78179931640625, -252.33502197265625, -246.88824462890625, -241.44146728515625, -235.9946746826172, -230.5478973388672, -225.1011199951172, -219.65432739257812, -214.20755004882812, -208.76077270507812, -203.31399536132812, -197.86721801757812, -192.42042541503906, -186.97364807128906, -181.52687072753906, -176.08009338378906, -170.63331604003906, -165.18653869628906, -159.73976135253906, -154.29296875, -148.84619140625, -143.3994140625, -137.95263671875, -132.505859375, -127.05908203125, -121.6123046875, -116.16551971435547, -110.71874237060547, -105.27196502685547, -99.82518005371094, -94.37840270996094, -88.9316177368164, -83.4848403930664, -78.03805541992188, -72.59127807617188, -67.14450073242188, -61.697723388671875, -56.25094223022461, -50.804161071777344, -45.357383728027344, -39.910606384277344, -34.46382522583008, -29.017045974731445, -23.570266723632812, -18.12348747253418, -12.676708221435547, -7.229927062988281, -1.7831497192382812, 3.6636295318603516, 9.110408782958984, 14.557188034057617, 20.00396728515625, 25.450746536254883, 30.897525787353516, 36.34430694580078, 41.79108428955078]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 8.0, 2.0, 12.0, 7.0, 13.0, 16.0, 20.0, 17.0, 23.0, 18.0, 20.0, 25.0, 27.0, 36.0, 48.0, 35.0, 30.0, 39.0, 34.0, 44.0, 39.0, 42.0, 27.0, 40.0, 30.0, 31.0, 34.0, 27.0, 33.0, 30.0, 25.0, 31.0, 18.0, 16.0, 11.0, 12.0, 17.0, 5.0, 17.0, 5.0, 13.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.7432861328125, -37.51582336425781, -36.288360595703125, -35.06089782714844, -33.83343505859375, -32.60597229003906, -31.378511428833008, -30.15104866027832, -28.923585891723633, -27.696123123168945, -26.468660354614258, -25.24119758605957, -24.013736724853516, -22.786273956298828, -21.55881118774414, -20.331348419189453, -19.103885650634766, -17.876422882080078, -16.64896011352539, -15.42149829864502, -14.194035530090332, -12.966572761535645, -11.739110946655273, -10.511648178100586, -9.284185409545898, -8.056722640991211, -6.829260349273682, -5.601798057556152, -4.374335289001465, -3.1468725204467773, -1.919410228729248, -0.6919479370117188, 0.5355148315429688, 1.7629773616790771, 2.9904398918151855, 4.217902183532715, 5.445364952087402, 6.67282772064209, 7.900290012359619, 9.127752304077148, 10.355215072631836, 11.582677841186523, 12.810140609741211, 14.037602424621582, 15.26506519317627, 16.49252700805664, 17.719989776611328, 18.947452545166016, 20.174915313720703, 21.40237808227539, 22.629840850830078, 23.857303619384766, 25.084766387939453, 26.31222915649414, 27.539690017700195, 28.767152786254883, 29.99461555480957, 31.222078323364258, 32.44953918457031, 33.677001953125, 34.90446472167969, 36.131927490234375, 37.35939025878906, 38.58685302734375, 39.81431579589844]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 42.0, 44.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 12.0, 9.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 15.0, 26.0, 45.0, 58.0, 78.0, 123.0, 201.0, 297.0, 462.0, 714.0, 1127.0, 1764.0, 2649.0, 4109.0, 6392.0, 9966.0, 15626.0, 24178.0, 37751.0, 58858.0, 89771.0, 130651.0, 166749.0, 158209.0, 117265.0, 78659.0, 51227.0, 32562.0, 21060.0, 13167.0, 8845.0, 5528.0, 3688.0, 2421.0, 1538.0, 967.0, 653.0, 394.0, 248.0, 188.0, 114.0, 79.0, 45.0, 26.0, 24.0, 6.0, 10.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.7431640625, -0.7205352783203125, -0.697906494140625, -0.6752777099609375, -0.65264892578125, -0.6300201416015625, -0.607391357421875, -0.5847625732421875, -0.5621337890625, -0.5395050048828125, -0.516876220703125, -0.4942474365234375, -0.47161865234375, -0.4489898681640625, -0.426361083984375, -0.4037322998046875, -0.381103515625, -0.3584747314453125, -0.335845947265625, -0.3132171630859375, -0.29058837890625, -0.2679595947265625, -0.245330810546875, -0.2227020263671875, -0.2000732421875, -0.1774444580078125, -0.154815673828125, -0.1321868896484375, -0.10955810546875, -0.0869293212890625, -0.064300537109375, -0.0416717529296875, -0.01904296875, 0.0035858154296875, 0.026214599609375, 0.0488433837890625, 0.07147216796875, 0.0941009521484375, 0.116729736328125, 0.1393585205078125, 0.1619873046875, 0.1846160888671875, 0.207244873046875, 0.2298736572265625, 0.25250244140625, 0.2751312255859375, 0.297760009765625, 0.3203887939453125, 0.343017578125, 0.3656463623046875, 0.388275146484375, 0.4109039306640625, 0.43353271484375, 0.4561614990234375, 0.478790283203125, 0.5014190673828125, 0.5240478515625, 0.5466766357421875, 0.569305419921875, 0.5919342041015625, 0.61456298828125, 0.6371917724609375, 0.659820556640625, 0.6824493408203125, 0.705078125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 6.0, 7.0, 13.0, 9.0, 13.0, 21.0, 22.0, 23.0, 25.0, 30.0, 26.0, 34.0, 38.0, 39.0, 46.0, 47.0, 43.0, 45.0, 1052.0, 31.0, 41.0, 31.0, 33.0, 35.0, 47.0, 36.0, 26.0, 33.0, 22.0, 19.0, 20.0, 22.0, 16.0, 5.0, 10.0, 8.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.08984375, -4.92645263671875, -4.7630615234375, -4.59967041015625, -4.436279296875, -4.27288818359375, -4.1094970703125, -3.94610595703125, -3.78271484375, -3.61932373046875, -3.4559326171875, -3.29254150390625, -3.129150390625, -2.96575927734375, -2.8023681640625, -2.63897705078125, -2.4755859375, -2.31219482421875, -2.1488037109375, -1.98541259765625, -1.822021484375, -1.65863037109375, -1.4952392578125, -1.33184814453125, -1.16845703125, -1.00506591796875, -0.8416748046875, -0.67828369140625, -0.514892578125, -0.35150146484375, -0.1881103515625, -0.02471923828125, 0.138671875, 0.30206298828125, 0.4654541015625, 0.62884521484375, 0.792236328125, 0.95562744140625, 1.1190185546875, 1.28240966796875, 1.44580078125, 1.60919189453125, 1.7725830078125, 1.93597412109375, 2.099365234375, 2.26275634765625, 2.4261474609375, 2.58953857421875, 2.7529296875, 2.91632080078125, 3.0797119140625, 3.24310302734375, 3.406494140625, 3.56988525390625, 3.7332763671875, 3.89666748046875, 4.06005859375, 4.22344970703125, 4.3868408203125, 4.55023193359375, 4.713623046875, 4.87701416015625, 5.0404052734375, 5.20379638671875, 5.3671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 13.0, 18.0, 35.0, 50.0, 75.0, 116.0, 186.0, 310.0, 522.0, 791.0, 1247.0, 1966.0, 3072.0, 4876.0, 7759.0, 12293.0, 19653.0, 30545.0, 48623.0, 74060.0, 109091.0, 145952.0, 1209332.0, 138691.0, 101158.0, 67319.0, 43447.0, 27722.0, 17804.0, 11105.0, 7083.0, 4377.0, 2895.0, 1831.0, 1149.0, 702.0, 469.0, 290.0, 171.0, 123.0, 78.0, 48.0, 27.0, 15.0, 9.0, 9.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.63330078125, -0.6137466430664062, -0.5941925048828125, -0.5746383666992188, -0.555084228515625, -0.5355300903320312, -0.5159759521484375, -0.49642181396484375, -0.47686767578125, -0.45731353759765625, -0.4377593994140625, -0.41820526123046875, -0.398651123046875, -0.37909698486328125, -0.3595428466796875, -0.33998870849609375, -0.3204345703125, -0.30088043212890625, -0.2813262939453125, -0.26177215576171875, -0.242218017578125, -0.22266387939453125, -0.2031097412109375, -0.18355560302734375, -0.16400146484375, -0.14444732666015625, -0.1248931884765625, -0.10533905029296875, -0.085784912109375, -0.06623077392578125, -0.0466766357421875, -0.02712249755859375, -0.007568359375, 0.01198577880859375, 0.0315399169921875, 0.05109405517578125, 0.070648193359375, 0.09020233154296875, 0.1097564697265625, 0.12931060791015625, 0.14886474609375, 0.16841888427734375, 0.1879730224609375, 0.20752716064453125, 0.227081298828125, 0.24663543701171875, 0.2661895751953125, 0.28574371337890625, 0.3052978515625, 0.32485198974609375, 0.3444061279296875, 0.36396026611328125, 0.383514404296875, 0.40306854248046875, 0.4226226806640625, 0.44217681884765625, 0.46173095703125, 0.48128509521484375, 0.5008392333984375, 0.5203933715820312, 0.539947509765625, 0.5595016479492188, 0.5790557861328125, 0.5986099243164062, 0.6181640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 14.0, 23.0, 32.0, 44.0, 54.0, 60.0, 73.0, 85.0, 91.0, 81.0, 84.0, 58.0, 68.0, 58.0, 36.0, 32.0, 17.0, 17.0, 15.0, 7.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00699615478515625, -0.006795704364776611, -0.006595253944396973, -0.006394803524017334, -0.006194353103637695, -0.005993902683258057, -0.005793452262878418, -0.005593001842498779, -0.005392551422119141, -0.005192101001739502, -0.004991650581359863, -0.004791200160980225, -0.004590749740600586, -0.004390299320220947, -0.004189848899841309, -0.00398939847946167, -0.0037889480590820312, -0.0035884976387023926, -0.003388047218322754, -0.0031875967979431152, -0.0029871463775634766, -0.002786695957183838, -0.0025862455368041992, -0.0023857951164245605, -0.002185344696044922, -0.001984894275665283, -0.0017844438552856445, -0.0015839934349060059, -0.0013835430145263672, -0.0011830925941467285, -0.0009826421737670898, -0.0007821917533874512, -0.0005817413330078125, -0.00038129091262817383, -0.00018084049224853516, 1.9609928131103516e-05, 0.0002200603485107422, 0.00042051076889038086, 0.0006209611892700195, 0.0008214116096496582, 0.0010218620300292969, 0.0012223124504089355, 0.0014227628707885742, 0.0016232132911682129, 0.0018236637115478516, 0.0020241141319274902, 0.002224564552307129, 0.0024250149726867676, 0.0026254653930664062, 0.002825915813446045, 0.0030263662338256836, 0.0032268166542053223, 0.003427267074584961, 0.0036277174949645996, 0.0038281679153442383, 0.004028618335723877, 0.004229068756103516, 0.004429519176483154, 0.004629969596862793, 0.004830420017242432, 0.00503087043762207, 0.005231320858001709, 0.005431771278381348, 0.005632221698760986, 0.005832672119140625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 14.0, 13.0, 7.0, 25.0, 29.0, 34.0, 66.0, 82.0, 149.0, 165.0, 329.0, 803.0, 60574.0, 983653.0, 1463.0, 432.0, 224.0, 149.0, 100.0, 72.0, 36.0, 31.0, 21.0, 14.0, 10.0, 16.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11328125, -0.10939979553222656, -0.10551834106445312, -0.10163688659667969, -0.09775543212890625, -0.09387397766113281, -0.08999252319335938, -0.08611106872558594, -0.0822296142578125, -0.07834815979003906, -0.07446670532226562, -0.07058525085449219, -0.06670379638671875, -0.06282234191894531, -0.058940887451171875, -0.05505943298339844, -0.051177978515625, -0.04729652404785156, -0.043415069580078125, -0.03953361511230469, -0.03565216064453125, -0.03177070617675781, -0.027889251708984375, -0.024007797241210938, -0.0201263427734375, -0.016244888305664062, -0.012363433837890625, -0.008481979370117188, -0.00460052490234375, -0.0007190704345703125, 0.003162384033203125, 0.0070438385009765625, 0.01092529296875, 0.014806747436523438, 0.018688201904296875, 0.022569656372070312, 0.02645111083984375, 0.030332565307617188, 0.034214019775390625, 0.03809547424316406, 0.0419769287109375, 0.04585838317871094, 0.049739837646484375, 0.05362129211425781, 0.05750274658203125, 0.06138420104980469, 0.06526565551757812, 0.06914710998535156, 0.073028564453125, 0.07691001892089844, 0.08079147338867188, 0.08467292785644531, 0.08855438232421875, 0.09243583679199219, 0.09631729125976562, 0.10019874572753906, 0.1040802001953125, 0.10796165466308594, 0.11184310913085938, 0.11572456359863281, 0.11960601806640625, 0.12348747253417969, 0.12736892700195312, 0.13125038146972656, 0.1351318359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 268.0, 748.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06338192522525787, -0.061718348413705826, -0.06005476787686348, -0.05839119106531143, -0.056727610528469086, -0.05506403371691704, -0.05340045690536499, -0.051736876368522644, -0.0500732958316803, -0.04840971902012825, -0.046746138483285904, -0.045082561671733856, -0.04341898113489151, -0.04175540432333946, -0.040091827511787415, -0.03842824697494507, -0.03676467016339302, -0.03510109335184097, -0.03343751281499863, -0.03177393600344658, -0.030110355466604233, -0.028446778655052185, -0.026783199980854988, -0.02511962130665779, -0.023456042632460594, -0.021792463958263397, -0.0201288852840662, -0.018465306609869003, -0.016801729798316956, -0.015138150192797184, -0.013474572449922562, -0.011810993775725365, -0.010147418826818466, -0.00848384015262127, -0.00682026194408536, -0.00515668373554945, -0.003493105061352253, -0.001829526387155056, -0.00016594864428043365, 0.0014976300299167633, 0.0031612087041139603, 0.004824787378311157, 0.006488365586847067, 0.008151943795382977, 0.009815522469580173, 0.01147910114377737, 0.013142678886651993, 0.01480625756084919, 0.016469836235046387, 0.018133414909243584, 0.01979699358344078, 0.02146057039499283, 0.023124150931835175, 0.024787727743387222, 0.02645130641758442, 0.028114885091781616, 0.029778463765978813, 0.03144204244017601, 0.03310561925172806, 0.034769199788570404, 0.03643277660012245, 0.0380963571369648, 0.039759933948516846, 0.04142351448535919, 0.04308709129691124]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 10.0, 13.0, 14.0, 13.0, 23.0, 27.0, 28.0, 33.0, 23.0, 26.0, 39.0, 35.0, 37.0, 45.0, 52.0, 52.0, 41.0, 54.0, 51.0, 47.0, 44.0, 49.0, 37.0, 30.0, 33.0, 34.0, 17.0, 19.0, 15.0, 19.0, 13.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024068355560302734, -0.002306555397808552, -0.00220627523958683, -0.0021059950813651085, -0.002005714923143387, -0.0019054347649216652, -0.0018051546066999435, -0.001704874448478222, -0.0016045942902565002, -0.0015043141320347786, -0.001404033973813057, -0.0013037538155913353, -0.0012034736573696136, -0.001103193499147892, -0.0010029133409261703, -0.0009026331827044487, -0.000802353024482727, -0.0007020728662610054, -0.0006017927080392838, -0.0005015125498175621, -0.00040123239159584045, -0.0003009522333741188, -0.00020067207515239716, -0.0001003919169306755, -1.1175870895385742e-07, 0.00010016839951276779, 0.00020044855773448944, 0.0003007287159562111, 0.00040100887417793274, 0.0005012890323996544, 0.000601569190621376, 0.0007018493488430977, 0.0008021295070648193, 0.000902409665286541, 0.0010026898235082626, 0.0011029699817299843, 0.001203250139951706, 0.0013035302981734276, 0.0014038104563951492, 0.0015040906146168709, 0.0016043707728385925, 0.0017046509310603142, 0.0018049310892820358, 0.0019052112475037575, 0.002005491405725479, 0.0021057715639472008, 0.0022060517221689224, 0.002306331880390644, 0.0024066120386123657, 0.0025068921968340874, 0.002607172355055809, 0.0027074525132775307, 0.0028077326714992523, 0.002908012829720974, 0.0030082929879426956, 0.0031085731461644173, 0.003208853304386139, 0.0033091334626078606, 0.003409413620829582, 0.003509693779051304, 0.0036099739372730255, 0.003710254095494747, 0.003810534253716469, 0.0039108144119381905, 0.004011094570159912]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 16.0, 11.0, 8.0, 12.0, 18.0, 14.0, 17.0, 21.0, 32.0, 27.0, 40.0, 29.0, 41.0, 38.0, 33.0, 34.0, 40.0, 30.0, 41.0, 51.0, 41.0, 45.0, 27.0, 47.0, 26.0, 30.0, 30.0, 23.0, 15.0, 22.0, 20.0, 23.0, 13.0, 8.0, 10.0, 11.0, 9.0, 6.0, 4.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.6328125, -8.37945556640625, -8.1260986328125, -7.87274169921875, -7.619384765625, -7.36602783203125, -7.1126708984375, -6.85931396484375, -6.60595703125, -6.35260009765625, -6.0992431640625, -5.84588623046875, -5.592529296875, -5.33917236328125, -5.0858154296875, -4.83245849609375, -4.5791015625, -4.32574462890625, -4.0723876953125, -3.81903076171875, -3.565673828125, -3.31231689453125, -3.0589599609375, -2.80560302734375, -2.55224609375, -2.29888916015625, -2.0455322265625, -1.79217529296875, -1.538818359375, -1.28546142578125, -1.0321044921875, -0.77874755859375, -0.525390625, -0.27203369140625, -0.0186767578125, 0.23468017578125, 0.488037109375, 0.74139404296875, 0.9947509765625, 1.24810791015625, 1.50146484375, 1.75482177734375, 2.0081787109375, 2.26153564453125, 2.514892578125, 2.76824951171875, 3.0216064453125, 3.27496337890625, 3.5283203125, 3.78167724609375, 4.0350341796875, 4.28839111328125, 4.541748046875, 4.79510498046875, 5.0484619140625, 5.30181884765625, 5.55517578125, 5.80853271484375, 6.0618896484375, 6.31524658203125, 6.568603515625, 6.82196044921875, 7.0753173828125, 7.32867431640625, 7.58203125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 6.0, 11.0, 9.0, 13.0, 18.0, 32.0, 29.0, 44.0, 61.0, 66.0, 124.0, 158.0, 272.0, 449.0, 831.0, 1526.0, 3095.0, 6202.0, 13311.0, 29188.0, 69345.0, 198131.0, 457629.0, 160008.0, 59471.0, 25691.0, 11428.0, 5389.0, 2681.0, 1367.0, 733.0, 370.0, 272.0, 172.0, 114.0, 73.0, 50.0, 44.0, 22.0, 31.0, 24.0, 16.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-11.0859375, -10.7637939453125, -10.441650390625, -10.1195068359375, -9.79736328125, -9.4752197265625, -9.153076171875, -8.8309326171875, -8.5087890625, -8.1866455078125, -7.864501953125, -7.5423583984375, -7.22021484375, -6.8980712890625, -6.575927734375, -6.2537841796875, -5.931640625, -5.6094970703125, -5.287353515625, -4.9652099609375, -4.64306640625, -4.3209228515625, -3.998779296875, -3.6766357421875, -3.3544921875, -3.0323486328125, -2.710205078125, -2.3880615234375, -2.06591796875, -1.7437744140625, -1.421630859375, -1.0994873046875, -0.77734375, -0.4552001953125, -0.133056640625, 0.1890869140625, 0.51123046875, 0.8333740234375, 1.155517578125, 1.4776611328125, 1.7998046875, 2.1219482421875, 2.444091796875, 2.7662353515625, 3.08837890625, 3.4105224609375, 3.732666015625, 4.0548095703125, 4.376953125, 4.6990966796875, 5.021240234375, 5.3433837890625, 5.66552734375, 5.9876708984375, 6.309814453125, 6.6319580078125, 6.9541015625, 7.2762451171875, 7.598388671875, 7.9205322265625, 8.24267578125, 8.5648193359375, 8.886962890625, 9.2091064453125, 9.53125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 10.0, 10.0, 9.0, 16.0, 17.0, 21.0, 27.0, 20.0, 31.0, 22.0, 37.0, 42.0, 43.0, 71.0, 82.0, 138.0, 1518.0, 336.0, 141.0, 70.0, 55.0, 40.0, 28.0, 33.0, 40.0, 21.0, 28.0, 23.0, 20.0, 6.0, 14.0, 11.0, 12.0, 9.0, 10.0, 5.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.6494140625, -21.892578125, -21.1357421875, -20.37890625, -19.6220703125, -18.865234375, -18.1083984375, -17.3515625, -16.5947265625, -15.837890625, -15.0810546875, -14.32421875, -13.5673828125, -12.810546875, -12.0537109375, -11.296875, -10.5400390625, -9.783203125, -9.0263671875, -8.26953125, -7.5126953125, -6.755859375, -5.9990234375, -5.2421875, -4.4853515625, -3.728515625, -2.9716796875, -2.21484375, -1.4580078125, -0.701171875, 0.0556640625, 0.8125, 1.5693359375, 2.326171875, 3.0830078125, 3.83984375, 4.5966796875, 5.353515625, 6.1103515625, 6.8671875, 7.6240234375, 8.380859375, 9.1376953125, 9.89453125, 10.6513671875, 11.408203125, 12.1650390625, 12.921875, 13.6787109375, 14.435546875, 15.1923828125, 15.94921875, 16.7060546875, 17.462890625, 18.2197265625, 18.9765625, 19.7333984375, 20.490234375, 21.2470703125, 22.00390625, 22.7607421875, 23.517578125, 24.2744140625, 25.03125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 10.0, 13.0, 19.0, 21.0, 28.0, 44.0, 50.0, 81.0, 102.0, 168.0, 248.0, 467.0, 1680.0, 19162.0, 1968957.0, 1135516.0, 16335.0, 1493.0, 491.0, 229.0, 161.0, 110.0, 79.0, 58.0, 38.0, 34.0, 25.0, 16.0, 15.0, 12.0, 2.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.3125, -36.990234375, -35.66796875, -34.345703125, -33.0234375, -31.701171875, -30.37890625, -29.056640625, -27.734375, -26.412109375, -25.08984375, -23.767578125, -22.4453125, -21.123046875, -19.80078125, -18.478515625, -17.15625, -15.833984375, -14.51171875, -13.189453125, -11.8671875, -10.544921875, -9.22265625, -7.900390625, -6.578125, -5.255859375, -3.93359375, -2.611328125, -1.2890625, 0.033203125, 1.35546875, 2.677734375, 4.0, 5.322265625, 6.64453125, 7.966796875, 9.2890625, 10.611328125, 11.93359375, 13.255859375, 14.578125, 15.900390625, 17.22265625, 18.544921875, 19.8671875, 21.189453125, 22.51171875, 23.833984375, 25.15625, 26.478515625, 27.80078125, 29.123046875, 30.4453125, 31.767578125, 33.08984375, 34.412109375, 35.734375, 37.056640625, 38.37890625, 39.701171875, 41.0234375, 42.345703125, 43.66796875, 44.990234375, 46.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 260.0, 748.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-568.1582641601562, -556.3590087890625, -544.5596923828125, -532.7604370117188, -520.961181640625, -509.1618957519531, -497.36260986328125, -485.5633544921875, -473.76409912109375, -461.9648132324219, -450.1655578613281, -438.36627197265625, -426.5670166015625, -414.7677307128906, -402.96844482421875, -391.169189453125, -379.3699035644531, -367.57061767578125, -355.7713623046875, -343.9720764160156, -332.1728210449219, -320.37353515625, -308.57427978515625, -296.7749938964844, -284.9757080078125, -273.1764221191406, -261.3771667480469, -249.577880859375, -237.77862548828125, -225.97933959960938, -214.18006896972656, -202.38079833984375, -190.58151245117188, -178.78224182128906, -166.98297119140625, -155.18368530273438, -143.38442993164062, -131.58514404296875, -119.78587341308594, -107.98660278320312, -96.18733215332031, -84.3880615234375, -72.58879089355469, -60.789512634277344, -48.99024200439453, -37.19097137451172, -25.391693115234375, -13.592422485351562, -1.79315185546875, 10.006120681762695, 21.80539321899414, 33.60466766357422, 45.40393829345703, 57.203208923339844, 69.00248718261719, 80.8017578125, 92.60102844238281, 104.40029907226562, 116.19956970214844, 127.99884796142578, 139.79812622070312, 151.59738159179688, 163.39666748046875, 175.19593811035156, 186.99520874023438]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 0.0, 9.0, 8.0, 7.0, 17.0, 18.0, 16.0, 12.0, 15.0, 24.0, 21.0, 30.0, 23.0, 27.0, 26.0, 35.0, 28.0, 44.0, 33.0, 38.0, 30.0, 36.0, 30.0, 31.0, 38.0, 37.0, 48.0, 29.0, 23.0, 37.0, 31.0, 22.0, 25.0, 28.0, 14.0, 19.0, 10.0, 15.0, 7.0, 6.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 5.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.95530700683594, -40.405799865722656, -38.856292724609375, -37.306785583496094, -35.75727844238281, -34.20777130126953, -32.65826416015625, -31.10875701904297, -29.559249877929688, -28.009742736816406, -26.460235595703125, -24.910728454589844, -23.361221313476562, -21.81171417236328, -20.26220703125, -18.71269989013672, -17.163192749023438, -15.613685607910156, -14.064178466796875, -12.514671325683594, -10.965164184570312, -9.415657043457031, -7.86614990234375, -6.316642761230469, -4.7671356201171875, -3.2176284790039062, -1.668121337890625, -0.11861419677734375, 1.4308929443359375, 2.9804000854492188, 4.5299072265625, 6.079414367675781, 7.6289215087890625, 9.178428649902344, 10.727935791015625, 12.277442932128906, 13.826950073242188, 15.376457214355469, 16.92596435546875, 18.47547149658203, 20.024978637695312, 21.574485778808594, 23.123992919921875, 24.673500061035156, 26.223007202148438, 27.77251434326172, 29.322021484375, 30.87152862548828, 32.42103576660156, 33.970542907714844, 35.520050048828125, 37.069557189941406, 38.61906433105469, 40.16857147216797, 41.71807861328125, 43.26758575439453, 44.81709289550781, 46.366600036621094, 47.916107177734375, 49.465614318847656, 51.01512145996094, 52.56462860107422, 54.1141357421875, 55.66364288330078, 57.21315002441406]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 18.0, 15.0, 10.0, 12.0, 21.0, 24.0, 21.0, 46.0, 34.0, 40.0, 46.0, 40.0, 26.0, 48.0, 28.0, 31.0, 47.0, 47.0, 52.0, 37.0, 36.0, 33.0, 27.0, 31.0, 33.0, 21.0, 30.0, 25.0, 16.0, 11.0, 7.0, 6.0, 6.0, 14.0, 4.0, 4.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.375732421875, -8.10302734375, -7.830322265625, -7.5576171875, -7.284912109375, -7.01220703125, -6.739501953125, -6.466796875, -6.194091796875, -5.92138671875, -5.648681640625, -5.3759765625, -5.103271484375, -4.83056640625, -4.557861328125, -4.28515625, -4.012451171875, -3.73974609375, -3.467041015625, -3.1943359375, -2.921630859375, -2.64892578125, -2.376220703125, -2.103515625, -1.830810546875, -1.55810546875, -1.285400390625, -1.0126953125, -0.739990234375, -0.46728515625, -0.194580078125, 0.078125, 0.350830078125, 0.62353515625, 0.896240234375, 1.1689453125, 1.441650390625, 1.71435546875, 1.987060546875, 2.259765625, 2.532470703125, 2.80517578125, 3.077880859375, 3.3505859375, 3.623291015625, 3.89599609375, 4.168701171875, 4.44140625, 4.714111328125, 4.98681640625, 5.259521484375, 5.5322265625, 5.804931640625, 6.07763671875, 6.350341796875, 6.623046875, 6.895751953125, 7.16845703125, 7.441162109375, 7.7138671875, 7.986572265625, 8.25927734375, 8.531982421875, 8.8046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 8.0, 9.0, 9.0, 13.0, 14.0, 18.0, 26.0, 47.0, 73.0, 119.0, 211.0, 379.0, 831.0, 1678.0, 4016.0, 10589.0, 36519.0, 281811.0, 2475834.0, 1247579.0, 101924.0, 20492.0, 6864.0, 2772.0, 1161.0, 576.0, 285.0, 162.0, 69.0, 56.0, 28.0, 28.0, 21.0, 9.0, 5.0, 10.0, 8.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.607177734375, -16.99560546875, -16.384033203125, -15.7724609375, -15.160888671875, -14.54931640625, -13.937744140625, -13.326171875, -12.714599609375, -12.10302734375, -11.491455078125, -10.8798828125, -10.268310546875, -9.65673828125, -9.045166015625, -8.43359375, -7.822021484375, -7.21044921875, -6.598876953125, -5.9873046875, -5.375732421875, -4.76416015625, -4.152587890625, -3.541015625, -2.929443359375, -2.31787109375, -1.706298828125, -1.0947265625, -0.483154296875, 0.12841796875, 0.739990234375, 1.3515625, 1.963134765625, 2.57470703125, 3.186279296875, 3.7978515625, 4.409423828125, 5.02099609375, 5.632568359375, 6.244140625, 6.855712890625, 7.46728515625, 8.078857421875, 8.6904296875, 9.302001953125, 9.91357421875, 10.525146484375, 11.13671875, 11.748291015625, 12.35986328125, 12.971435546875, 13.5830078125, 14.194580078125, 14.80615234375, 15.417724609375, 16.029296875, 16.640869140625, 17.25244140625, 17.864013671875, 18.4755859375, 19.087158203125, 19.69873046875, 20.310302734375, 20.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 13.0, 10.0, 8.0, 19.0, 24.0, 22.0, 21.0, 26.0, 57.0, 59.0, 72.0, 97.0, 139.0, 182.0, 291.0, 385.0, 476.0, 528.0, 484.0, 353.0, 220.0, 149.0, 98.0, 87.0, 59.0, 49.0, 27.0, 32.0, 19.0, 8.0, 13.0, 14.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.36865234375, -10.9794921875, -10.59033203125, -10.201171875, -9.81201171875, -9.4228515625, -9.03369140625, -8.64453125, -8.25537109375, -7.8662109375, -7.47705078125, -7.087890625, -6.69873046875, -6.3095703125, -5.92041015625, -5.53125, -5.14208984375, -4.7529296875, -4.36376953125, -3.974609375, -3.58544921875, -3.1962890625, -2.80712890625, -2.41796875, -2.02880859375, -1.6396484375, -1.25048828125, -0.861328125, -0.47216796875, -0.0830078125, 0.30615234375, 0.6953125, 1.08447265625, 1.4736328125, 1.86279296875, 2.251953125, 2.64111328125, 3.0302734375, 3.41943359375, 3.80859375, 4.19775390625, 4.5869140625, 4.97607421875, 5.365234375, 5.75439453125, 6.1435546875, 6.53271484375, 6.921875, 7.31103515625, 7.7001953125, 8.08935546875, 8.478515625, 8.86767578125, 9.2568359375, 9.64599609375, 10.03515625, 10.42431640625, 10.8134765625, 11.20263671875, 11.591796875, 11.98095703125, 12.3701171875, 12.75927734375, 13.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 10.0, 6.0, 12.0, 20.0, 30.0, 28.0, 57.0, 63.0, 113.0, 174.0, 333.0, 624.0, 1487.0, 3482.0, 10410.0, 36931.0, 179319.0, 2119541.0, 1646334.0, 149476.0, 31126.0, 8838.0, 3092.0, 1328.0, 572.0, 304.0, 166.0, 105.0, 87.0, 50.0, 36.0, 20.0, 25.0, 17.0, 8.0, 9.0, 12.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.84375, -19.20263671875, -18.5615234375, -17.92041015625, -17.279296875, -16.63818359375, -15.9970703125, -15.35595703125, -14.71484375, -14.07373046875, -13.4326171875, -12.79150390625, -12.150390625, -11.50927734375, -10.8681640625, -10.22705078125, -9.5859375, -8.94482421875, -8.3037109375, -7.66259765625, -7.021484375, -6.38037109375, -5.7392578125, -5.09814453125, -4.45703125, -3.81591796875, -3.1748046875, -2.53369140625, -1.892578125, -1.25146484375, -0.6103515625, 0.03076171875, 0.671875, 1.31298828125, 1.9541015625, 2.59521484375, 3.236328125, 3.87744140625, 4.5185546875, 5.15966796875, 5.80078125, 6.44189453125, 7.0830078125, 7.72412109375, 8.365234375, 9.00634765625, 9.6474609375, 10.28857421875, 10.9296875, 11.57080078125, 12.2119140625, 12.85302734375, 13.494140625, 14.13525390625, 14.7763671875, 15.41748046875, 16.05859375, 16.69970703125, 17.3408203125, 17.98193359375, 18.623046875, 19.26416015625, 19.9052734375, 20.54638671875, 21.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 19.0, 44.0, 139.0, 290.0, 281.0, 151.0, 56.0, 19.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.59783935546875, -122.66924285888672, -118.74064636230469, -114.81204986572266, -110.88345336914062, -106.9548568725586, -103.02626037597656, -99.09766387939453, -95.1690673828125, -91.24047088623047, -87.31187438964844, -83.3832778930664, -79.45468139648438, -75.52608489990234, -71.59748840332031, -67.66889190673828, -63.74029541015625, -59.81169891357422, -55.88310241699219, -51.954505920410156, -48.025909423828125, -44.097312927246094, -40.16871643066406, -36.24011993408203, -32.3115234375, -28.38292694091797, -24.454330444335938, -20.525733947753906, -16.597137451171875, -12.668540954589844, -8.739944458007812, -4.811347961425781, -0.8827438354492188, 3.0458526611328125, 6.974449157714844, 10.903045654296875, 14.831642150878906, 18.760238647460938, 22.68883514404297, 26.617431640625, 30.54602813720703, 34.47462463378906, 38.403221130371094, 42.331817626953125, 46.260414123535156, 50.18901062011719, 54.11760711669922, 58.04620361328125, 61.97480010986328, 65.90339660644531, 69.83199310302734, 73.76058959960938, 77.6891860961914, 81.61778259277344, 85.54637908935547, 89.4749755859375, 93.40357208251953, 97.33216857910156, 101.2607650756836, 105.18936157226562, 109.11795806884766, 113.04655456542969, 116.97515106201172, 120.90374755859375, 124.83234405517578]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 19.0, 15.0, 12.0, 18.0, 27.0, 24.0, 28.0, 19.0, 28.0, 29.0, 31.0, 40.0, 38.0, 35.0, 44.0, 65.0, 36.0, 57.0, 39.0, 44.0, 39.0, 36.0, 31.0, 28.0, 37.0, 24.0, 18.0, 17.0, 18.0, 24.0, 10.0, 15.0, 3.0, 3.0, 10.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.79145812988281, -45.34745788574219, -43.9034538269043, -42.45945358276367, -41.01544952392578, -39.571449279785156, -38.12744903564453, -36.683448791503906, -35.239444732666016, -33.79544448852539, -32.3514404296875, -30.907440185546875, -29.463438034057617, -28.01943588256836, -26.575435638427734, -25.131433486938477, -23.68743133544922, -22.24342918395996, -20.799427032470703, -19.355426788330078, -17.91142463684082, -16.467422485351562, -15.023421287536621, -13.57942008972168, -12.135417938232422, -10.691415786743164, -9.247414588928223, -7.803412914276123, -6.359411239624023, -4.915409564971924, -3.471407890319824, -2.027406692504883, -0.583404541015625, 0.8605971336364746, 2.304598808288574, 3.748600482940674, 5.192602157592773, 6.636603832244873, 8.080605506896973, 9.524606704711914, 10.968608856201172, 12.41261100769043, 13.856612205505371, 15.300613403320312, 16.74461555480957, 18.188617706298828, 19.632617950439453, 21.07662010192871, 22.52062225341797, 23.964624404907227, 25.408626556396484, 26.85262680053711, 28.296628952026367, 29.740631103515625, 31.18463134765625, 32.628631591796875, 34.072635650634766, 35.51663589477539, 36.96063995361328, 38.404640197753906, 39.84864044189453, 41.29264450073242, 42.73664474487305, 44.18064880371094, 45.62464904785156]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 37.0, 32.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 15.0, 28.0, 45.0, 76.0, 100.0, 138.0, 287.0, 422.0, 621.0, 975.0, 1593.0, 2414.0, 3662.0, 5509.0, 8398.0, 12881.0, 19744.0, 29915.0, 45489.0, 69748.0, 102557.0, 142764.0, 165714.0, 139976.0, 100131.0, 67459.0, 43936.0, 29116.0, 18868.0, 12353.0, 8225.0, 5373.0, 3490.0, 2308.0, 1507.0, 924.0, 655.0, 433.0, 233.0, 173.0, 115.0, 65.0, 38.0, 25.0, 19.0, 7.0, 12.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7734375, -0.7496109008789062, -0.7257843017578125, -0.7019577026367188, -0.678131103515625, -0.6543045043945312, -0.6304779052734375, -0.6066513061523438, -0.58282470703125, -0.5589981079101562, -0.5351715087890625, -0.5113449096679688, -0.487518310546875, -0.46369171142578125, -0.4398651123046875, -0.41603851318359375, -0.3922119140625, -0.36838531494140625, -0.3445587158203125, -0.32073211669921875, -0.296905517578125, -0.27307891845703125, -0.2492523193359375, -0.22542572021484375, -0.20159912109375, -0.17777252197265625, -0.1539459228515625, -0.13011932373046875, -0.106292724609375, -0.08246612548828125, -0.0586395263671875, -0.03481292724609375, -0.010986328125, 0.01284027099609375, 0.0366668701171875, 0.06049346923828125, 0.084320068359375, 0.10814666748046875, 0.1319732666015625, 0.15579986572265625, 0.17962646484375, 0.20345306396484375, 0.2272796630859375, 0.25110626220703125, 0.274932861328125, 0.29875946044921875, 0.3225860595703125, 0.34641265869140625, 0.3702392578125, 0.39406585693359375, 0.4178924560546875, 0.44171905517578125, 0.465545654296875, 0.48937225341796875, 0.5131988525390625, 0.5370254516601562, 0.56085205078125, 0.5846786499023438, 0.6085052490234375, 0.6323318481445312, 0.656158447265625, 0.6799850463867188, 0.7038116455078125, 0.7276382446289062, 0.75146484375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 18.0, 14.0, 13.0, 26.0, 22.0, 30.0, 33.0, 30.0, 28.0, 34.0, 40.0, 46.0, 54.0, 47.0, 44.0, 1087.0, 55.0, 54.0, 40.0, 33.0, 46.0, 30.0, 30.0, 29.0, 31.0, 24.0, 17.0, 10.0, 16.0, 13.0, 11.0, 2.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.046875, -6.83404541015625, -6.6212158203125, -6.40838623046875, -6.195556640625, -5.98272705078125, -5.7698974609375, -5.55706787109375, -5.34423828125, -5.13140869140625, -4.9185791015625, -4.70574951171875, -4.492919921875, -4.28009033203125, -4.0672607421875, -3.85443115234375, -3.6416015625, -3.42877197265625, -3.2159423828125, -3.00311279296875, -2.790283203125, -2.57745361328125, -2.3646240234375, -2.15179443359375, -1.93896484375, -1.72613525390625, -1.5133056640625, -1.30047607421875, -1.087646484375, -0.87481689453125, -0.6619873046875, -0.44915771484375, -0.236328125, -0.02349853515625, 0.1893310546875, 0.40216064453125, 0.614990234375, 0.82781982421875, 1.0406494140625, 1.25347900390625, 1.46630859375, 1.67913818359375, 1.8919677734375, 2.10479736328125, 2.317626953125, 2.53045654296875, 2.7432861328125, 2.95611572265625, 3.1689453125, 3.38177490234375, 3.5946044921875, 3.80743408203125, 4.020263671875, 4.23309326171875, 4.4459228515625, 4.65875244140625, 4.87158203125, 5.08441162109375, 5.2972412109375, 5.51007080078125, 5.722900390625, 5.93572998046875, 6.1485595703125, 6.36138916015625, 6.57421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 15.0, 39.0, 72.0, 74.0, 119.0, 197.0, 319.0, 587.0, 952.0, 1558.0, 2712.0, 4492.0, 7300.0, 12253.0, 20097.0, 33125.0, 53363.0, 84543.0, 127512.0, 233118.0, 1151065.0, 131273.0, 88571.0, 55972.0, 34525.0, 21011.0, 12874.0, 7758.0, 4676.0, 2830.0, 1683.0, 893.0, 634.0, 356.0, 214.0, 140.0, 70.0, 45.0, 35.0, 17.0, 12.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-0.8037109375, -0.7814178466796875, -0.759124755859375, -0.7368316650390625, -0.71453857421875, -0.6922454833984375, -0.669952392578125, -0.6476593017578125, -0.6253662109375, -0.6030731201171875, -0.580780029296875, -0.5584869384765625, -0.53619384765625, -0.5139007568359375, -0.491607666015625, -0.4693145751953125, -0.447021484375, -0.4247283935546875, -0.402435302734375, -0.3801422119140625, -0.35784912109375, -0.3355560302734375, -0.313262939453125, -0.2909698486328125, -0.2686767578125, -0.2463836669921875, -0.224090576171875, -0.2017974853515625, -0.17950439453125, -0.1572113037109375, -0.134918212890625, -0.1126251220703125, -0.09033203125, -0.0680389404296875, -0.045745849609375, -0.0234527587890625, -0.00115966796875, 0.0211334228515625, 0.043426513671875, 0.0657196044921875, 0.0880126953125, 0.1103057861328125, 0.132598876953125, 0.1548919677734375, 0.17718505859375, 0.1994781494140625, 0.221771240234375, 0.2440643310546875, 0.266357421875, 0.2886505126953125, 0.310943603515625, 0.3332366943359375, 0.35552978515625, 0.3778228759765625, 0.400115966796875, 0.4224090576171875, 0.4447021484375, 0.4669952392578125, 0.489288330078125, 0.5115814208984375, 0.53387451171875, 0.5561676025390625, 0.578460693359375, 0.6007537841796875, 0.623046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 8.0, 25.0, 28.0, 33.0, 50.0, 62.0, 69.0, 90.0, 118.0, 123.0, 79.0, 55.0, 68.0, 50.0, 32.0, 20.0, 14.0, 15.0, 7.0, 5.0, 5.0, 2.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006488800048828125, -0.006296992301940918, -0.006105184555053711, -0.005913376808166504, -0.005721569061279297, -0.00552976131439209, -0.005337953567504883, -0.005146145820617676, -0.004954338073730469, -0.004762530326843262, -0.004570722579956055, -0.004378914833068848, -0.004187107086181641, -0.003995299339294434, -0.0038034915924072266, -0.0036116838455200195, -0.0034198760986328125, -0.0032280683517456055, -0.0030362606048583984, -0.0028444528579711914, -0.0026526451110839844, -0.0024608373641967773, -0.0022690296173095703, -0.0020772218704223633, -0.0018854141235351562, -0.0016936063766479492, -0.0015017986297607422, -0.0013099908828735352, -0.0011181831359863281, -0.0009263753890991211, -0.0007345676422119141, -0.000542759895324707, -0.0003509521484375, -0.00015914440155029297, 3.266334533691406e-05, 0.0002244710922241211, 0.0004162788391113281, 0.0006080865859985352, 0.0007998943328857422, 0.0009917020797729492, 0.0011835098266601562, 0.0013753175735473633, 0.0015671253204345703, 0.0017589330673217773, 0.0019507408142089844, 0.0021425485610961914, 0.0023343563079833984, 0.0025261640548706055, 0.0027179718017578125, 0.0029097795486450195, 0.0031015872955322266, 0.0032933950424194336, 0.0034852027893066406, 0.0036770105361938477, 0.0038688182830810547, 0.004060626029968262, 0.004252433776855469, 0.004444241523742676, 0.004636049270629883, 0.00482785701751709, 0.005019664764404297, 0.005211472511291504, 0.005403280258178711, 0.005595088005065918, 0.005786895751953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 13.0, 10.0, 12.0, 21.0, 30.0, 32.0, 50.0, 78.0, 130.0, 188.0, 325.0, 794.0, 23484.0, 1019948.0, 2174.0, 519.0, 234.0, 156.0, 100.0, 82.0, 44.0, 32.0, 8.0, 12.0, 9.0, 12.0, 3.0, 6.0, 1.0, 5.0, 5.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1087646484375, -0.10517406463623047, -0.10158348083496094, -0.0979928970336914, -0.09440231323242188, -0.09081172943115234, -0.08722114562988281, -0.08363056182861328, -0.08003997802734375, -0.07644939422607422, -0.07285881042480469, -0.06926822662353516, -0.06567764282226562, -0.062087059020996094, -0.05849647521972656, -0.05490589141845703, -0.0513153076171875, -0.04772472381591797, -0.04413414001464844, -0.040543556213378906, -0.036952972412109375, -0.033362388610839844, -0.029771804809570312, -0.02618122100830078, -0.02259063720703125, -0.01900005340576172, -0.015409469604492188, -0.011818885803222656, -0.008228302001953125, -0.004637718200683594, -0.0010471343994140625, 0.0025434494018554688, 0.006134033203125, 0.009724617004394531, 0.013315200805664062, 0.016905784606933594, 0.020496368408203125, 0.024086952209472656, 0.027677536010742188, 0.03126811981201172, 0.03485870361328125, 0.03844928741455078, 0.04203987121582031, 0.045630455017089844, 0.049221038818359375, 0.052811622619628906, 0.05640220642089844, 0.05999279022216797, 0.0635833740234375, 0.06717395782470703, 0.07076454162597656, 0.0743551254272461, 0.07794570922851562, 0.08153629302978516, 0.08512687683105469, 0.08871746063232422, 0.09230804443359375, 0.09589862823486328, 0.09948921203613281, 0.10307979583740234, 0.10667037963867188, 0.1102609634399414, 0.11385154724121094, 0.11744213104248047, 0.12103271484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 63.0, 697.0, 237.0, 14.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02969544380903244, -0.029085952788591385, -0.02847646363079548, -0.027866972610354424, -0.027257483452558517, -0.026647992432117462, -0.026038503274321556, -0.0254290122538805, -0.024819523096084595, -0.02421003207564354, -0.023600542917847633, -0.022991051897406578, -0.022381562739610672, -0.021772071719169617, -0.02116258256137371, -0.020553091540932655, -0.01994360238313675, -0.019334111362695694, -0.018724622204899788, -0.018115131184458733, -0.017505642026662827, -0.01689615100622177, -0.016286661848425865, -0.01567717082798481, -0.015067679807543755, -0.014458189718425274, -0.013848699629306793, -0.013239209540188313, -0.012629719451069832, -0.012020229361951351, -0.01141073927283287, -0.010801248252391815, -0.010191758163273335, -0.009582268074154854, -0.008972777985036373, -0.008363287895917892, -0.007753797806799412, -0.007144307717680931, -0.006534817162901163, -0.005925327073782682, -0.005315836984664202, -0.004706346895545721, -0.00409685680642724, -0.003487366484478116, -0.0028778763953596354, -0.0022683863062411547, -0.0016588959842920303, -0.0010494058951735497, -0.00043991580605506897, 0.00016957434127107263, 0.0007790644885972142, 0.0013885546941310167, 0.0019980447832494974, 0.002607534872367978, 0.0032170251943171024, 0.003826515283435583, 0.004436005372554064, 0.0050454954616725445, 0.005654985550791025, 0.006264476105570793, 0.006873966194689274, 0.0074834562838077545, 0.008092946372926235, 0.008702436462044716, 0.009311926551163197]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 12.0, 3.0, 7.0, 12.0, 11.0, 8.0, 10.0, 16.0, 16.0, 19.0, 23.0, 25.0, 34.0, 25.0, 31.0, 33.0, 32.0, 38.0, 44.0, 38.0, 46.0, 29.0, 34.0, 43.0, 44.0, 43.0, 35.0, 30.0, 43.0, 33.0, 26.0, 22.0, 21.0, 18.0, 17.0, 16.0, 15.0, 8.0, 6.0, 9.0, 5.0, 10.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020622611045837402, -0.001985718496143818, -0.0019091758877038956, -0.0018326332792639732, -0.001756090670824051, -0.0016795480623841286, -0.0016030054539442062, -0.001526462845504284, -0.0014499202370643616, -0.0013733776286244392, -0.001296835020184517, -0.0012202924117445946, -0.0011437498033046722, -0.00106720719486475, -0.0009906645864248276, -0.0009141219779849052, -0.0008375793695449829, -0.0007610367611050606, -0.0006844941526651382, -0.0006079515442252159, -0.0005314089357852936, -0.00045486632734537125, -0.0003783237189054489, -0.0003017811104655266, -0.00022523850202560425, -0.00014869589358568192, -7.215328514575958e-05, 4.38932329416275e-06, 8.093193173408508e-05, 0.00015747454017400742, 0.00023401714861392975, 0.0003105597570538521, 0.0003871023654937744, 0.00046364497393369675, 0.0005401875823736191, 0.0006167301908135414, 0.0006932727992534637, 0.0007698154076933861, 0.0008463580161333084, 0.0009229006245732307, 0.000999443233013153, 0.0010759858414530754, 0.0011525284498929977, 0.00122907105833292, 0.0013056136667728424, 0.0013821562752127647, 0.001458698883652687, 0.0015352414920926094, 0.0016117841005325317, 0.001688326708972454, 0.0017648693174123764, 0.0018414119258522987, 0.001917954534292221, 0.0019944971427321434, 0.0020710397511720657, 0.002147582359611988, 0.0022241249680519104, 0.0023006675764918327, 0.002377210184931755, 0.0024537527933716774, 0.0025302954018115997, 0.002606838010251522, 0.0026833806186914444, 0.0027599232271313667, 0.002836465835571289]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 13.0, 7.0, 8.0, 14.0, 8.0, 21.0, 8.0, 12.0, 20.0, 27.0, 27.0, 32.0, 25.0, 31.0, 31.0, 31.0, 33.0, 41.0, 38.0, 34.0, 40.0, 46.0, 35.0, 31.0, 36.0, 33.0, 38.0, 18.0, 25.0, 42.0, 18.0, 17.0, 14.0, 14.0, 16.0, 16.0, 8.0, 12.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-7.73828125, -7.49237060546875, -7.2464599609375, -7.00054931640625, -6.754638671875, -6.50872802734375, -6.2628173828125, -6.01690673828125, -5.77099609375, -5.52508544921875, -5.2791748046875, -5.03326416015625, -4.787353515625, -4.54144287109375, -4.2955322265625, -4.04962158203125, -3.8037109375, -3.55780029296875, -3.3118896484375, -3.06597900390625, -2.820068359375, -2.57415771484375, -2.3282470703125, -2.08233642578125, -1.83642578125, -1.59051513671875, -1.3446044921875, -1.09869384765625, -0.852783203125, -0.60687255859375, -0.3609619140625, -0.11505126953125, 0.130859375, 0.37677001953125, 0.6226806640625, 0.86859130859375, 1.114501953125, 1.36041259765625, 1.6063232421875, 1.85223388671875, 2.09814453125, 2.34405517578125, 2.5899658203125, 2.83587646484375, 3.081787109375, 3.32769775390625, 3.5736083984375, 3.81951904296875, 4.0654296875, 4.31134033203125, 4.5572509765625, 4.80316162109375, 5.049072265625, 5.29498291015625, 5.5408935546875, 5.78680419921875, 6.03271484375, 6.27862548828125, 6.5245361328125, 6.77044677734375, 7.016357421875, 7.26226806640625, 7.5081787109375, 7.75408935546875, 8.0]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 9.0, 9.0, 12.0, 20.0, 24.0, 36.0, 46.0, 63.0, 73.0, 103.0, 152.0, 177.0, 276.0, 378.0, 535.0, 809.0, 1350.0, 2199.0, 4275.0, 8286.0, 17543.0, 39348.0, 94978.0, 310848.0, 370471.0, 111253.0, 44667.0, 19946.0, 9313.0, 4657.0, 2453.0, 1409.0, 865.0, 559.0, 376.0, 250.0, 195.0, 141.0, 96.0, 99.0, 68.0, 59.0, 33.0, 28.0, 19.0, 14.0, 8.0, 11.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.7265625, -9.42333984375, -9.1201171875, -8.81689453125, -8.513671875, -8.21044921875, -7.9072265625, -7.60400390625, -7.30078125, -6.99755859375, -6.6943359375, -6.39111328125, -6.087890625, -5.78466796875, -5.4814453125, -5.17822265625, -4.875, -4.57177734375, -4.2685546875, -3.96533203125, -3.662109375, -3.35888671875, -3.0556640625, -2.75244140625, -2.44921875, -2.14599609375, -1.8427734375, -1.53955078125, -1.236328125, -0.93310546875, -0.6298828125, -0.32666015625, -0.0234375, 0.27978515625, 0.5830078125, 0.88623046875, 1.189453125, 1.49267578125, 1.7958984375, 2.09912109375, 2.40234375, 2.70556640625, 3.0087890625, 3.31201171875, 3.615234375, 3.91845703125, 4.2216796875, 4.52490234375, 4.828125, 5.13134765625, 5.4345703125, 5.73779296875, 6.041015625, 6.34423828125, 6.6474609375, 6.95068359375, 7.25390625, 7.55712890625, 7.8603515625, 8.16357421875, 8.466796875, 8.77001953125, 9.0732421875, 9.37646484375, 9.6796875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 5.0, 7.0, 11.0, 17.0, 12.0, 13.0, 24.0, 18.0, 36.0, 35.0, 29.0, 24.0, 49.0, 52.0, 67.0, 80.0, 151.0, 1480.0, 314.0, 124.0, 75.0, 48.0, 40.0, 40.0, 41.0, 33.0, 31.0, 26.0, 24.0, 14.0, 18.0, 24.0, 14.0, 6.0, 15.0, 8.0, 5.0, 4.0, 3.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.134521484375, -16.47216796875, -15.809814453125, -15.1474609375, -14.485107421875, -13.82275390625, -13.160400390625, -12.498046875, -11.835693359375, -11.17333984375, -10.510986328125, -9.8486328125, -9.186279296875, -8.52392578125, -7.861572265625, -7.19921875, -6.536865234375, -5.87451171875, -5.212158203125, -4.5498046875, -3.887451171875, -3.22509765625, -2.562744140625, -1.900390625, -1.238037109375, -0.57568359375, 0.086669921875, 0.7490234375, 1.411376953125, 2.07373046875, 2.736083984375, 3.3984375, 4.060791015625, 4.72314453125, 5.385498046875, 6.0478515625, 6.710205078125, 7.37255859375, 8.034912109375, 8.697265625, 9.359619140625, 10.02197265625, 10.684326171875, 11.3466796875, 12.009033203125, 12.67138671875, 13.333740234375, 13.99609375, 14.658447265625, 15.32080078125, 15.983154296875, 16.6455078125, 17.307861328125, 17.97021484375, 18.632568359375, 19.294921875, 19.957275390625, 20.61962890625, 21.281982421875, 21.9443359375, 22.606689453125, 23.26904296875, 23.931396484375, 24.59375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 17.0, 13.0, 21.0, 25.0, 29.0, 41.0, 70.0, 91.0, 165.0, 250.0, 450.0, 1363.0, 18100.0, 2900034.0, 218769.0, 4581.0, 736.0, 316.0, 203.0, 118.0, 72.0, 52.0, 51.0, 39.0, 29.0, 15.0, 11.0, 7.0, 11.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.90625, -41.30419921875, -39.7021484375, -38.10009765625, -36.498046875, -34.89599609375, -33.2939453125, -31.69189453125, -30.08984375, -28.48779296875, -26.8857421875, -25.28369140625, -23.681640625, -22.07958984375, -20.4775390625, -18.87548828125, -17.2734375, -15.67138671875, -14.0693359375, -12.46728515625, -10.865234375, -9.26318359375, -7.6611328125, -6.05908203125, -4.45703125, -2.85498046875, -1.2529296875, 0.34912109375, 1.951171875, 3.55322265625, 5.1552734375, 6.75732421875, 8.359375, 9.96142578125, 11.5634765625, 13.16552734375, 14.767578125, 16.36962890625, 17.9716796875, 19.57373046875, 21.17578125, 22.77783203125, 24.3798828125, 25.98193359375, 27.583984375, 29.18603515625, 30.7880859375, 32.39013671875, 33.9921875, 35.59423828125, 37.1962890625, 38.79833984375, 40.400390625, 42.00244140625, 43.6044921875, 45.20654296875, 46.80859375, 48.41064453125, 50.0126953125, 51.61474609375, 53.216796875, 54.81884765625, 56.4208984375, 58.02294921875, 59.625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 33.0, 93.0, 286.0, 353.0, 184.0, 46.0, 14.0, 2.0, 3.0, 1.0], "bins": [-146.693359375, -144.13621520996094, -141.5790557861328, -139.02191162109375, -136.46475219726562, -133.90760803222656, -131.3504638671875, -128.79330444335938, -126.23616027832031, -123.67900848388672, -121.12185668945312, -118.56471252441406, -116.00756072998047, -113.45040893554688, -110.89325714111328, -108.33610534667969, -105.7789535522461, -103.2218017578125, -100.6646499633789, -98.10750579833984, -95.55035400390625, -92.99320220947266, -90.43605041503906, -87.87889862060547, -85.32174682617188, -82.76459503173828, -80.20744323730469, -77.65029907226562, -75.09314727783203, -72.53599548339844, -69.97884368896484, -67.42169189453125, -64.86454010009766, -62.30738830566406, -59.750240325927734, -57.19308853149414, -54.63594055175781, -52.07878875732422, -49.521636962890625, -46.96448516845703, -44.40734100341797, -41.850189208984375, -39.29304122924805, -36.73588943481445, -34.178741455078125, -31.62158966064453, -29.064437866210938, -26.507287979125977, -23.950136184692383, -21.392986297607422, -18.835834503173828, -16.278684616088867, -13.721534729003906, -11.164384841918945, -8.607234001159668, -6.050083160400391, -3.4929332733154297, -0.9357829093933105, 1.6213674545288086, 4.178517818450928, 6.735668182373047, 9.292818069458008, 11.849968910217285, 14.407119750976562, 16.964269638061523]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 11.0, 7.0, 10.0, 9.0, 7.0, 13.0, 16.0, 21.0, 26.0, 25.0, 23.0, 30.0, 40.0, 31.0, 31.0, 37.0, 36.0, 39.0, 47.0, 41.0, 34.0, 41.0, 41.0, 38.0, 31.0, 32.0, 35.0, 33.0, 23.0, 26.0, 23.0, 12.0, 16.0, 14.0, 20.0, 16.0, 8.0, 10.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-48.311767578125, -46.86762237548828, -45.4234733581543, -43.97932434082031, -42.535179138183594, -41.091033935546875, -39.64688491821289, -38.202735900878906, -36.75859069824219, -35.31444549560547, -33.870296478271484, -32.4261474609375, -30.98200225830078, -29.53785514831543, -28.093708038330078, -26.649560928344727, -25.205413818359375, -23.761266708374023, -22.317119598388672, -20.87297248840332, -19.42882537841797, -17.984678268432617, -16.540531158447266, -15.096384048461914, -13.652236938476562, -12.208089828491211, -10.76394271850586, -9.319795608520508, -7.875648498535156, -6.431501388549805, -4.987354278564453, -3.5432071685791016, -2.09906005859375, -0.6549129486083984, 0.7892341613769531, 2.2333812713623047, 3.6775283813476562, 5.121675491333008, 6.565822601318359, 8.009969711303711, 9.454116821289062, 10.898263931274414, 12.342411041259766, 13.786558151245117, 15.230705261230469, 16.67485237121582, 18.118999481201172, 19.563146591186523, 21.007293701171875, 22.451440811157227, 23.895587921142578, 25.33973503112793, 26.78388214111328, 28.228029251098633, 29.672176361083984, 31.116323471069336, 32.56047058105469, 34.004615783691406, 35.44876480102539, 36.892913818359375, 38.337059020996094, 39.78120422363281, 41.2253532409668, 42.66950225830078, 44.1136474609375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 12.0, 11.0, 12.0, 10.0, 3.0, 12.0, 5.0, 21.0, 22.0, 26.0, 30.0, 20.0, 33.0, 39.0, 27.0, 29.0, 38.0, 37.0, 32.0, 42.0, 49.0, 39.0, 54.0, 35.0, 33.0, 31.0, 36.0, 19.0, 29.0, 27.0, 20.0, 18.0, 12.0, 17.0, 16.0, 9.0, 19.0, 9.0, 13.0, 2.0, 6.0, 8.0, 10.0, 3.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-8.15625, -7.90435791015625, -7.6524658203125, -7.40057373046875, -7.148681640625, -6.89678955078125, -6.6448974609375, -6.39300537109375, -6.14111328125, -5.88922119140625, -5.6373291015625, -5.38543701171875, -5.133544921875, -4.88165283203125, -4.6297607421875, -4.37786865234375, -4.1259765625, -3.87408447265625, -3.6221923828125, -3.37030029296875, -3.118408203125, -2.86651611328125, -2.6146240234375, -2.36273193359375, -2.11083984375, -1.85894775390625, -1.6070556640625, -1.35516357421875, -1.103271484375, -0.85137939453125, -0.5994873046875, -0.34759521484375, -0.095703125, 0.15618896484375, 0.4080810546875, 0.65997314453125, 0.911865234375, 1.16375732421875, 1.4156494140625, 1.66754150390625, 1.91943359375, 2.17132568359375, 2.4232177734375, 2.67510986328125, 2.927001953125, 3.17889404296875, 3.4307861328125, 3.68267822265625, 3.9345703125, 4.18646240234375, 4.4383544921875, 4.69024658203125, 4.942138671875, 5.19403076171875, 5.4459228515625, 5.69781494140625, 5.94970703125, 6.20159912109375, 6.4534912109375, 6.70538330078125, 6.957275390625, 7.20916748046875, 7.4610595703125, 7.71295166015625, 7.96484375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 4.0, 14.0, 14.0, 19.0, 27.0, 44.0, 33.0, 58.0, 73.0, 108.0, 144.0, 179.0, 252.0, 362.0, 416.0, 3142.0, 4176288.0, 11109.0, 553.0, 359.0, 258.0, 198.0, 142.0, 105.0, 76.0, 64.0, 35.0, 42.0, 24.0, 21.0, 21.0, 14.0, 8.0, 9.0, 9.0, 8.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.5, -144.451171875, -139.40234375, -134.353515625, -129.3046875, -124.255859375, -119.20703125, -114.158203125, -109.109375, -104.060546875, -99.01171875, -93.962890625, -88.9140625, -83.865234375, -78.81640625, -73.767578125, -68.71875, -63.669921875, -58.62109375, -53.572265625, -48.5234375, -43.474609375, -38.42578125, -33.376953125, -28.328125, -23.279296875, -18.23046875, -13.181640625, -8.1328125, -3.083984375, 1.96484375, 7.013671875, 12.0625, 17.111328125, 22.16015625, 27.208984375, 32.2578125, 37.306640625, 42.35546875, 47.404296875, 52.453125, 57.501953125, 62.55078125, 67.599609375, 72.6484375, 77.697265625, 82.74609375, 87.794921875, 92.84375, 97.892578125, 102.94140625, 107.990234375, 113.0390625, 118.087890625, 123.13671875, 128.185546875, 133.234375, 138.283203125, 143.33203125, 148.380859375, 153.4296875, 158.478515625, 163.52734375, 168.576171875, 173.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 19.0, 21.0, 24.0, 49.0, 63.0, 94.0, 126.0, 226.0, 384.0, 682.0, 854.0, 585.0, 348.0, 170.0, 129.0, 84.0, 57.0, 32.0, 40.0, 22.0, 12.0, 12.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.990966796875, -18.40380859375, -17.816650390625, -17.2294921875, -16.642333984375, -16.05517578125, -15.468017578125, -14.880859375, -14.293701171875, -13.70654296875, -13.119384765625, -12.5322265625, -11.945068359375, -11.35791015625, -10.770751953125, -10.18359375, -9.596435546875, -9.00927734375, -8.422119140625, -7.8349609375, -7.247802734375, -6.66064453125, -6.073486328125, -5.486328125, -4.899169921875, -4.31201171875, -3.724853515625, -3.1376953125, -2.550537109375, -1.96337890625, -1.376220703125, -0.7890625, -0.201904296875, 0.38525390625, 0.972412109375, 1.5595703125, 2.146728515625, 2.73388671875, 3.321044921875, 3.908203125, 4.495361328125, 5.08251953125, 5.669677734375, 6.2568359375, 6.843994140625, 7.43115234375, 8.018310546875, 8.60546875, 9.192626953125, 9.77978515625, 10.366943359375, 10.9541015625, 11.541259765625, 12.12841796875, 12.715576171875, 13.302734375, 13.889892578125, 14.47705078125, 15.064208984375, 15.6513671875, 16.238525390625, 16.82568359375, 17.412841796875, 18.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 10.0, 19.0, 16.0, 18.0, 16.0, 16.0, 28.0, 37.0, 45.0, 52.0, 80.0, 148.0, 465.0, 7015.0, 3826648.0, 356646.0, 2273.0, 315.0, 103.0, 51.0, 47.0, 33.0, 37.0, 29.0, 27.0, 19.0, 10.0, 8.0, 12.0, 7.0, 11.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.875, -78.1650390625, -75.455078125, -72.7451171875, -70.03515625, -67.3251953125, -64.615234375, -61.9052734375, -59.1953125, -56.4853515625, -53.775390625, -51.0654296875, -48.35546875, -45.6455078125, -42.935546875, -40.2255859375, -37.515625, -34.8056640625, -32.095703125, -29.3857421875, -26.67578125, -23.9658203125, -21.255859375, -18.5458984375, -15.8359375, -13.1259765625, -10.416015625, -7.7060546875, -4.99609375, -2.2861328125, 0.423828125, 3.1337890625, 5.84375, 8.5537109375, 11.263671875, 13.9736328125, 16.68359375, 19.3935546875, 22.103515625, 24.8134765625, 27.5234375, 30.2333984375, 32.943359375, 35.6533203125, 38.36328125, 41.0732421875, 43.783203125, 46.4931640625, 49.203125, 51.9130859375, 54.623046875, 57.3330078125, 60.04296875, 62.7529296875, 65.462890625, 68.1728515625, 70.8828125, 73.5927734375, 76.302734375, 79.0126953125, 81.72265625, 84.4326171875, 87.142578125, 89.8525390625, 92.5625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 20.0, 52.0, 135.0, 229.0, 230.0, 194.0, 85.0, 50.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.47761535644531, -99.20384216308594, -95.93006896972656, -92.65629577636719, -89.38252258300781, -86.10874938964844, -82.83497619628906, -79.56120300292969, -76.28742980957031, -73.01365661621094, -69.73988342285156, -66.46611022949219, -63.19233703613281, -59.91856384277344, -56.6447868347168, -53.37101364135742, -50.09723663330078, -46.823463439941406, -43.54969024658203, -40.275917053222656, -37.00214385986328, -33.728370666503906, -30.454593658447266, -27.18082046508789, -23.907047271728516, -20.63327407836914, -17.359500885009766, -14.085725784301758, -10.811952590942383, -7.538179397583008, -4.264404296875, -0.990631103515625, 2.2831497192382812, 5.5569233894348145, 8.830697059631348, 12.104471206665039, 15.378244400024414, 18.65201759338379, 21.925792694091797, 25.199565887451172, 28.473339080810547, 31.747112274169922, 35.0208854675293, 38.29466247558594, 41.56843566894531, 44.84220886230469, 48.11598205566406, 51.38975524902344, 54.66352844238281, 57.93730163574219, 61.21107482910156, 64.48484802246094, 67.75862121582031, 71.03239440917969, 74.30616760253906, 77.57994079589844, 80.85371398925781, 84.12748718261719, 87.40126037597656, 90.67503356933594, 93.94880676269531, 97.22257995605469, 100.49635314941406, 103.77012634277344, 107.04390716552734]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 3.0, 4.0, 5.0, 13.0, 13.0, 16.0, 19.0, 17.0, 18.0, 22.0, 23.0, 27.0, 36.0, 42.0, 33.0, 54.0, 41.0, 54.0, 42.0, 42.0, 42.0, 49.0, 51.0, 35.0, 28.0, 31.0, 25.0, 32.0, 24.0, 18.0, 29.0, 15.0, 15.0, 14.0, 15.0, 13.0, 11.0, 4.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.605979919433594, -45.07762908935547, -43.54928207397461, -42.020931243896484, -40.49258041381836, -38.964229583740234, -37.435882568359375, -35.90753173828125, -34.379180908203125, -32.850830078125, -31.322481155395508, -29.794132232666016, -28.26578140258789, -26.7374324798584, -25.209083557128906, -23.68073272705078, -22.15238380432129, -20.624034881591797, -19.095684051513672, -17.56733512878418, -16.038984298706055, -14.510635375976562, -12.982285499572754, -11.453935623168945, -9.925585746765137, -8.397235870361328, -6.8688859939575195, -5.340536594390869, -3.8121867179870605, -2.283836841583252, -0.7554874420166016, 0.772862434387207, 2.3012123107910156, 3.829562187194824, 5.357912063598633, 6.886261463165283, 8.41461181640625, 9.942960739135742, 11.47131061553955, 12.99966049194336, 14.528010368347168, 16.056360244750977, 17.58470916748047, 19.113059997558594, 20.641408920288086, 22.16975975036621, 23.698108673095703, 25.226459503173828, 26.75480842590332, 28.283157348632812, 29.811508178710938, 31.33985710144043, 32.86820602416992, 34.39655685424805, 35.92490768432617, 37.45325469970703, 38.981605529785156, 40.50995635986328, 42.03830337524414, 43.566654205322266, 45.09500503540039, 46.623355865478516, 48.151702880859375, 49.6800537109375, 51.208404541015625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 13.0, 19.0, 30.0, 39.0, 56.0, 82.0, 127.0, 220.0, 274.0, 389.0, 586.0, 884.0, 1306.0, 1933.0, 2793.0, 4259.0, 6228.0, 9150.0, 14096.0, 20973.0, 32139.0, 49192.0, 74998.0, 110500.0, 148374.0, 161428.0, 132301.0, 93210.0, 62298.0, 40583.0, 26800.0, 17650.0, 11721.0, 7725.0, 5175.0, 3566.0, 2366.0, 1613.0, 1123.0, 714.0, 519.0, 333.0, 236.0, 159.0, 122.0, 75.0, 51.0, 33.0, 33.0, 15.0, 15.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.72021484375, -0.6971893310546875, -0.674163818359375, -0.6511383056640625, -0.62811279296875, -0.6050872802734375, -0.582061767578125, -0.5590362548828125, -0.5360107421875, -0.5129852294921875, -0.489959716796875, -0.4669342041015625, -0.44390869140625, -0.4208831787109375, -0.397857666015625, -0.3748321533203125, -0.351806640625, -0.3287811279296875, -0.305755615234375, -0.2827301025390625, -0.25970458984375, -0.2366790771484375, -0.213653564453125, -0.1906280517578125, -0.1676025390625, -0.1445770263671875, -0.121551513671875, -0.0985260009765625, -0.07550048828125, -0.0524749755859375, -0.029449462890625, -0.0064239501953125, 0.0166015625, 0.0396270751953125, 0.062652587890625, 0.0856781005859375, 0.10870361328125, 0.1317291259765625, 0.154754638671875, 0.1777801513671875, 0.2008056640625, 0.2238311767578125, 0.246856689453125, 0.2698822021484375, 0.29290771484375, 0.3159332275390625, 0.338958740234375, 0.3619842529296875, 0.385009765625, 0.4080352783203125, 0.431060791015625, 0.4540863037109375, 0.47711181640625, 0.5001373291015625, 0.523162841796875, 0.5461883544921875, 0.5692138671875, 0.5922393798828125, 0.615264892578125, 0.6382904052734375, 0.66131591796875, 0.6843414306640625, 0.707366943359375, 0.7303924560546875, 0.75341796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 3.0, 6.0, 5.0, 8.0, 9.0, 10.0, 11.0, 16.0, 19.0, 18.0, 24.0, 19.0, 33.0, 43.0, 40.0, 38.0, 46.0, 46.0, 36.0, 52.0, 1063.0, 61.0, 42.0, 44.0, 33.0, 38.0, 34.0, 36.0, 33.0, 24.0, 24.0, 23.0, 18.0, 13.0, 11.0, 10.0, 8.0, 2.0, 11.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-7.29296875, -7.09478759765625, -6.8966064453125, -6.69842529296875, -6.500244140625, -6.30206298828125, -6.1038818359375, -5.90570068359375, -5.70751953125, -5.50933837890625, -5.3111572265625, -5.11297607421875, -4.914794921875, -4.71661376953125, -4.5184326171875, -4.32025146484375, -4.1220703125, -3.92388916015625, -3.7257080078125, -3.52752685546875, -3.329345703125, -3.13116455078125, -2.9329833984375, -2.73480224609375, -2.53662109375, -2.33843994140625, -2.1402587890625, -1.94207763671875, -1.743896484375, -1.54571533203125, -1.3475341796875, -1.14935302734375, -0.951171875, -0.75299072265625, -0.5548095703125, -0.35662841796875, -0.158447265625, 0.03973388671875, 0.2379150390625, 0.43609619140625, 0.63427734375, 0.83245849609375, 1.0306396484375, 1.22882080078125, 1.427001953125, 1.62518310546875, 1.8233642578125, 2.02154541015625, 2.2197265625, 2.41790771484375, 2.6160888671875, 2.81427001953125, 3.012451171875, 3.21063232421875, 3.4088134765625, 3.60699462890625, 3.80517578125, 4.00335693359375, 4.2015380859375, 4.39971923828125, 4.597900390625, 4.79608154296875, 4.9942626953125, 5.19244384765625, 5.390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 14.0, 22.0, 29.0, 42.0, 91.0, 137.0, 201.0, 328.0, 559.0, 882.0, 1479.0, 2350.0, 3786.0, 6270.0, 9840.0, 15555.0, 24569.0, 38407.0, 60681.0, 92453.0, 130781.0, 1206477.0, 158106.0, 118844.0, 81881.0, 52651.0, 33791.0, 21154.0, 13419.0, 8306.0, 5426.0, 3288.0, 2038.0, 1281.0, 754.0, 502.0, 286.0, 173.0, 115.0, 61.0, 37.0, 26.0, 11.0, 11.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.64599609375, -0.6257095336914062, -0.6054229736328125, -0.5851364135742188, -0.564849853515625, -0.5445632934570312, -0.5242767333984375, -0.5039901733398438, -0.48370361328125, -0.46341705322265625, -0.4431304931640625, -0.42284393310546875, -0.402557373046875, -0.38227081298828125, -0.3619842529296875, -0.34169769287109375, -0.3214111328125, -0.30112457275390625, -0.2808380126953125, -0.26055145263671875, -0.240264892578125, -0.21997833251953125, -0.1996917724609375, -0.17940521240234375, -0.15911865234375, -0.13883209228515625, -0.1185455322265625, -0.09825897216796875, -0.077972412109375, -0.05768585205078125, -0.0373992919921875, -0.01711273193359375, 0.003173828125, 0.02346038818359375, 0.0437469482421875, 0.06403350830078125, 0.084320068359375, 0.10460662841796875, 0.1248931884765625, 0.14517974853515625, 0.16546630859375, 0.18575286865234375, 0.2060394287109375, 0.22632598876953125, 0.246612548828125, 0.26689910888671875, 0.2871856689453125, 0.30747222900390625, 0.3277587890625, 0.34804534912109375, 0.3683319091796875, 0.38861846923828125, 0.408905029296875, 0.42919158935546875, 0.4494781494140625, 0.46976470947265625, 0.49005126953125, 0.5103378295898438, 0.5306243896484375, 0.5509109497070312, 0.571197509765625, 0.5914840698242188, 0.6117706298828125, 0.6320571899414062, 0.65234375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 4.0, 3.0, 11.0, 10.0, 12.0, 18.0, 9.0, 18.0, 20.0, 31.0, 33.0, 29.0, 35.0, 27.0, 53.0, 62.0, 59.0, 60.0, 64.0, 53.0, 68.0, 44.0, 38.0, 43.0, 22.0, 26.0, 21.0, 22.0, 18.0, 6.0, 14.0, 8.0, 8.0, 4.0, 1.0, 9.0, 4.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0036296844482421875, -0.0035242438316345215, -0.0034188032150268555, -0.0033133625984191895, -0.0032079219818115234, -0.0031024813652038574, -0.0029970407485961914, -0.0028916001319885254, -0.0027861595153808594, -0.0026807188987731934, -0.0025752782821655273, -0.0024698376655578613, -0.0023643970489501953, -0.0022589564323425293, -0.0021535158157348633, -0.0020480751991271973, -0.0019426345825195312, -0.0018371939659118652, -0.0017317533493041992, -0.0016263127326965332, -0.0015208721160888672, -0.0014154314994812012, -0.0013099908828735352, -0.0012045502662658691, -0.0010991096496582031, -0.0009936690330505371, -0.0008882284164428711, -0.0007827877998352051, -0.0006773471832275391, -0.000571906566619873, -0.00046646595001220703, -0.000361025333404541, -0.000255584716796875, -0.00015014410018920898, -4.470348358154297e-05, 6.073713302612305e-05, 0.00016617774963378906, 0.0002716183662414551, 0.0003770589828491211, 0.0004824995994567871, 0.0005879402160644531, 0.0006933808326721191, 0.0007988214492797852, 0.0009042620658874512, 0.0010097026824951172, 0.0011151432991027832, 0.0012205839157104492, 0.0013260245323181152, 0.0014314651489257812, 0.0015369057655334473, 0.0016423463821411133, 0.0017477869987487793, 0.0018532276153564453, 0.0019586682319641113, 0.0020641088485717773, 0.0021695494651794434, 0.0022749900817871094, 0.0023804306983947754, 0.0024858713150024414, 0.0025913119316101074, 0.0026967525482177734, 0.0028021931648254395, 0.0029076337814331055, 0.0030130743980407715, 0.0031185150146484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 12.0, 6.0, 8.0, 9.0, 16.0, 17.0, 16.0, 28.0, 49.0, 58.0, 60.0, 95.0, 118.0, 143.0, 209.0, 380.0, 636.0, 2082.0, 183891.0, 852706.0, 5818.0, 755.0, 423.0, 270.0, 159.0, 107.0, 98.0, 68.0, 53.0, 43.0, 32.0, 34.0, 27.0, 18.0, 19.0, 12.0, 8.0, 13.0, 10.0, 6.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05596590042114258, -0.053978919982910156, -0.051991939544677734, -0.05000495910644531, -0.04801797866821289, -0.04603099822998047, -0.04404401779174805, -0.042057037353515625, -0.0400700569152832, -0.03808307647705078, -0.03609609603881836, -0.03410911560058594, -0.032122135162353516, -0.030135154724121094, -0.028148174285888672, -0.02616119384765625, -0.024174213409423828, -0.022187232971191406, -0.020200252532958984, -0.018213272094726562, -0.01622629165649414, -0.014239311218261719, -0.012252330780029297, -0.010265350341796875, -0.008278369903564453, -0.006291389465332031, -0.004304409027099609, -0.0023174285888671875, -0.0003304481506347656, 0.0016565322875976562, 0.003643512725830078, 0.0056304931640625, 0.007617473602294922, 0.009604454040527344, 0.011591434478759766, 0.013578414916992188, 0.01556539535522461, 0.01755237579345703, 0.019539356231689453, 0.021526336669921875, 0.023513317108154297, 0.02550029754638672, 0.02748727798461914, 0.029474258422851562, 0.031461238861083984, 0.033448219299316406, 0.03543519973754883, 0.03742218017578125, 0.03940916061401367, 0.041396141052246094, 0.043383121490478516, 0.04537010192871094, 0.04735708236694336, 0.04934406280517578, 0.0513310432434082, 0.053318023681640625, 0.05530500411987305, 0.05729198455810547, 0.05927896499633789, 0.06126594543457031, 0.06325292587280273, 0.06523990631103516, 0.06722688674926758, 0.0692138671875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 56.0, 357.0, 415.0, 129.0, 36.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01804562658071518, -0.01769249700009823, -0.017339367419481277, -0.016986237838864326, -0.016633108258247375, -0.016279976814985275, -0.015926849097013474, -0.015573718585073948, -0.015220588073134422, -0.014867458492517471, -0.01451432891190052, -0.01416119933128357, -0.013808068819344044, -0.013454939238727093, -0.013101809658110142, -0.01274868007749319, -0.01239555049687624, -0.012042420916259289, -0.011689291335642338, -0.011336160823702812, -0.010983031243085861, -0.01062990166246891, -0.01027677208185196, -0.009923642501235008, -0.009570512920618057, -0.009217383340001106, -0.008864253759384155, -0.008511124178767204, -0.008157993666827679, -0.007804864086210728, -0.007451734505593777, -0.007098604924976826, -0.006745473947376013, -0.006392344366759062, -0.0060392143204808235, -0.0056860847398638725, -0.0053329551592469215, -0.004979825112968683, -0.004626695532351732, -0.004273565486073494, -0.003920435905456543, -0.0035673060920089483, -0.0032141762785613537, -0.0028610466979444027, -0.002507916884496808, -0.0021547870710492134, -0.0018016574904322624, -0.0014485276769846678, -0.0010953978635370731, -0.0007422681082971394, -0.0003891383530572057, -3.600865602493286e-05, 0.0003171211574226618, 0.0006702509708702564, 0.0010233805514872074, 0.001376510364934802, 0.0017296401783823967, 0.0020827699918299913, 0.002435899805277586, 0.002789029385894537, 0.0031421591993421316, 0.0034952890127897263, 0.0038484185934066772, 0.004201548174023628, 0.0045546782203018665]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 10.0, 5.0, 11.0, 15.0, 14.0, 21.0, 15.0, 14.0, 27.0, 10.0, 33.0, 30.0, 29.0, 33.0, 33.0, 23.0, 48.0, 34.0, 39.0, 34.0, 33.0, 35.0, 34.0, 36.0, 44.0, 38.0, 36.0, 25.0, 30.0, 20.0, 20.0, 24.0, 24.0, 15.0, 18.0, 18.0, 11.0, 8.0, 11.0, 5.0, 2.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0018517374992370605, -0.0017941063269972801, -0.0017364751547574997, -0.0016788439825177193, -0.0016212128102779388, -0.0015635816380381584, -0.001505950465798378, -0.0014483192935585976, -0.0013906881213188171, -0.0013330569490790367, -0.0012754257768392563, -0.0012177946045994759, -0.0011601634323596954, -0.001102532260119915, -0.0010449010878801346, -0.0009872699156403542, -0.0009296387434005737, -0.0008720075711607933, -0.0008143763989210129, -0.0007567452266812325, -0.000699114054441452, -0.0006414828822016716, -0.0005838517099618912, -0.0005262205377221107, -0.0004685893654823303, -0.0004109581932425499, -0.00035332702100276947, -0.00029569584876298904, -0.00023806467652320862, -0.0001804335042834282, -0.00012280233204364777, -6.517115980386734e-05, -7.539987564086914e-06, 5.009118467569351e-05, 0.00010772235691547394, 0.00016535352915525436, 0.0002229847013950348, 0.0002806158736348152, 0.00033824704587459564, 0.00039587821811437607, 0.0004535093903541565, 0.0005111405625939369, 0.0005687717348337173, 0.0006264029070734978, 0.0006840340793132782, 0.0007416652515530586, 0.000799296423792839, 0.0008569275960326195, 0.0009145587682723999, 0.0009721899405121803, 0.0010298211127519608, 0.0010874522849917412, 0.0011450834572315216, 0.001202714629471302, 0.0012603458017110825, 0.0013179769739508629, 0.0013756081461906433, 0.0014332393184304237, 0.0014908704906702042, 0.0015485016629099846, 0.001606132835149765, 0.0016637640073895454, 0.0017213951796293259, 0.0017790263518691063, 0.0018366575241088867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 9.0, 6.0, 15.0, 16.0, 21.0, 24.0, 27.0, 18.0, 34.0, 29.0, 35.0, 33.0, 41.0, 38.0, 53.0, 43.0, 36.0, 39.0, 44.0, 39.0, 45.0, 47.0, 35.0, 30.0, 36.0, 29.0, 20.0, 20.0, 16.0, 23.0, 16.0, 12.0, 8.0, 6.0, 8.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6273193359375, -8.340576171875, -8.0538330078125, -7.76708984375, -7.4803466796875, -7.193603515625, -6.9068603515625, -6.6201171875, -6.3333740234375, -6.046630859375, -5.7598876953125, -5.47314453125, -5.1864013671875, -4.899658203125, -4.6129150390625, -4.326171875, -4.0394287109375, -3.752685546875, -3.4659423828125, -3.17919921875, -2.8924560546875, -2.605712890625, -2.3189697265625, -2.0322265625, -1.7454833984375, -1.458740234375, -1.1719970703125, -0.88525390625, -0.5985107421875, -0.311767578125, -0.0250244140625, 0.26171875, 0.5484619140625, 0.835205078125, 1.1219482421875, 1.40869140625, 1.6954345703125, 1.982177734375, 2.2689208984375, 2.5556640625, 2.8424072265625, 3.129150390625, 3.4158935546875, 3.70263671875, 3.9893798828125, 4.276123046875, 4.5628662109375, 4.849609375, 5.1363525390625, 5.423095703125, 5.7098388671875, 5.99658203125, 6.2833251953125, 6.570068359375, 6.8568115234375, 7.1435546875, 7.4302978515625, 7.717041015625, 8.0037841796875, 8.29052734375, 8.5772705078125, 8.864013671875, 9.1507568359375, 9.4375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 5.0, 15.0, 12.0, 19.0, 19.0, 20.0, 41.0, 50.0, 81.0, 95.0, 148.0, 188.0, 222.0, 262.0, 406.0, 609.0, 756.0, 1159.0, 1853.0, 3643.0, 9085.0, 31994.0, 156486.0, 578455.0, 201604.0, 40311.0, 10594.0, 4043.0, 1997.0, 1270.0, 838.0, 623.0, 433.0, 282.0, 213.0, 177.0, 128.0, 104.0, 86.0, 54.0, 40.0, 35.0, 23.0, 21.0, 8.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.359375, -14.8729248046875, -14.386474609375, -13.9000244140625, -13.41357421875, -12.9271240234375, -12.440673828125, -11.9542236328125, -11.4677734375, -10.9813232421875, -10.494873046875, -10.0084228515625, -9.52197265625, -9.0355224609375, -8.549072265625, -8.0626220703125, -7.576171875, -7.0897216796875, -6.603271484375, -6.1168212890625, -5.63037109375, -5.1439208984375, -4.657470703125, -4.1710205078125, -3.6845703125, -3.1981201171875, -2.711669921875, -2.2252197265625, -1.73876953125, -1.2523193359375, -0.765869140625, -0.2794189453125, 0.20703125, 0.6934814453125, 1.179931640625, 1.6663818359375, 2.15283203125, 2.6392822265625, 3.125732421875, 3.6121826171875, 4.0986328125, 4.5850830078125, 5.071533203125, 5.5579833984375, 6.04443359375, 6.5308837890625, 7.017333984375, 7.5037841796875, 7.990234375, 8.4766845703125, 8.963134765625, 9.4495849609375, 9.93603515625, 10.4224853515625, 10.908935546875, 11.3953857421875, 11.8818359375, 12.3682861328125, 12.854736328125, 13.3411865234375, 13.82763671875, 14.3140869140625, 14.800537109375, 15.2869873046875, 15.7734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 3.0, 5.0, 14.0, 15.0, 5.0, 16.0, 17.0, 25.0, 23.0, 37.0, 34.0, 46.0, 34.0, 66.0, 83.0, 163.0, 1496.0, 371.0, 123.0, 64.0, 53.0, 46.0, 40.0, 28.0, 29.0, 31.0, 33.0, 26.0, 20.0, 21.0, 12.0, 11.0, 12.0, 5.0, 7.0, 10.0, 11.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.96875, -21.28076171875, -20.5927734375, -19.90478515625, -19.216796875, -18.52880859375, -17.8408203125, -17.15283203125, -16.46484375, -15.77685546875, -15.0888671875, -14.40087890625, -13.712890625, -13.02490234375, -12.3369140625, -11.64892578125, -10.9609375, -10.27294921875, -9.5849609375, -8.89697265625, -8.208984375, -7.52099609375, -6.8330078125, -6.14501953125, -5.45703125, -4.76904296875, -4.0810546875, -3.39306640625, -2.705078125, -2.01708984375, -1.3291015625, -0.64111328125, 0.046875, 0.73486328125, 1.4228515625, 2.11083984375, 2.798828125, 3.48681640625, 4.1748046875, 4.86279296875, 5.55078125, 6.23876953125, 6.9267578125, 7.61474609375, 8.302734375, 8.99072265625, 9.6787109375, 10.36669921875, 11.0546875, 11.74267578125, 12.4306640625, 13.11865234375, 13.806640625, 14.49462890625, 15.1826171875, 15.87060546875, 16.55859375, 17.24658203125, 17.9345703125, 18.62255859375, 19.310546875, 19.99853515625, 20.6865234375, 21.37451171875, 22.0625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 6.0, 0.0, 6.0, 7.0, 10.0, 7.0, 12.0, 15.0, 12.0, 29.0, 20.0, 34.0, 33.0, 54.0, 83.0, 131.0, 203.0, 407.0, 788.0, 3044.0, 3091129.0, 47132.0, 1279.0, 506.0, 275.0, 138.0, 102.0, 61.0, 37.0, 38.0, 19.0, 23.0, 11.0, 9.0, 9.0, 5.0, 2.0, 4.0, 10.0, 5.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-102.3125, -99.6015625, -96.890625, -94.1796875, -91.46875, -88.7578125, -86.046875, -83.3359375, -80.625, -77.9140625, -75.203125, -72.4921875, -69.78125, -67.0703125, -64.359375, -61.6484375, -58.9375, -56.2265625, -53.515625, -50.8046875, -48.09375, -45.3828125, -42.671875, -39.9609375, -37.25, -34.5390625, -31.828125, -29.1171875, -26.40625, -23.6953125, -20.984375, -18.2734375, -15.5625, -12.8515625, -10.140625, -7.4296875, -4.71875, -2.0078125, 0.703125, 3.4140625, 6.125, 8.8359375, 11.546875, 14.2578125, 16.96875, 19.6796875, 22.390625, 25.1015625, 27.8125, 30.5234375, 33.234375, 35.9453125, 38.65625, 41.3671875, 44.078125, 46.7890625, 49.5, 52.2109375, 54.921875, 57.6328125, 60.34375, 63.0546875, 65.765625, 68.4765625, 71.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 597.0, 395.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.3544921875, -212.21298217773438, -202.07147216796875, -191.92994689941406, -181.78843688964844, -171.6469268798828, -161.50540161132812, -151.3638916015625, -141.22238159179688, -131.08087158203125, -120.9393539428711, -110.79783630371094, -100.65632629394531, -90.51481628417969, -80.37329864501953, -70.23178100585938, -60.09027099609375, -49.94875717163086, -39.80724334716797, -29.665729522705078, -19.524215698242188, -9.382701873779297, 0.7588119506835938, 10.90032958984375, 21.041839599609375, 31.183353424072266, 41.324867248535156, 51.46638107299805, 61.60789489746094, 71.74940490722656, 81.89092254638672, 92.03244018554688, 102.1739501953125, 112.31546020507812, 122.45697784423828, 132.59849548339844, 142.74000549316406, 152.8815155029297, 163.02304077148438, 173.16455078125, 183.30606079101562, 193.44757080078125, 203.58908081054688, 213.73060607910156, 223.8721160888672, 234.0136260986328, 244.1551513671875, 254.29666137695312, 264.43817138671875, 274.5796813964844, 284.72119140625, 294.8627014160156, 305.00421142578125, 315.145751953125, 325.2872619628906, 335.42877197265625, 345.5702819824219, 355.7117919921875, 365.8533020019531, 375.99481201171875, 386.1363525390625, 396.2778625488281, 406.41937255859375, 416.5608825683594, 426.702392578125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 12.0, 5.0, 9.0, 8.0, 16.0, 16.0, 21.0, 15.0, 22.0, 26.0, 29.0, 32.0, 28.0, 28.0, 40.0, 32.0, 44.0, 41.0, 39.0, 35.0, 47.0, 47.0, 38.0, 50.0, 40.0, 29.0, 33.0, 32.0, 18.0, 27.0, 21.0, 26.0, 6.0, 6.0, 11.0, 21.0, 7.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.22264862060547, -57.51224899291992, -55.80184555053711, -54.09144592285156, -52.381046295166016, -50.67064666748047, -48.960243225097656, -47.24984359741211, -45.53944396972656, -43.829044342041016, -42.1186408996582, -40.408241271972656, -38.69784164428711, -36.98744201660156, -35.27703857421875, -33.5666389465332, -31.856237411499023, -30.145835876464844, -28.435436248779297, -26.725034713745117, -25.01463508605957, -23.30423355102539, -21.593833923339844, -19.883432388305664, -18.173030853271484, -16.462629318237305, -14.752229690551758, -13.041828155517578, -11.331428527832031, -9.621026992797852, -7.910626411437988, -6.200225830078125, -4.489826202392578, -2.779425621032715, -1.0690248012542725, 0.6413760185241699, 2.351776599884033, 4.062177658081055, 5.772578239440918, 7.482978820800781, 9.193379402160645, 10.903779983520508, 12.614180564880371, 14.324581146240234, 16.034982681274414, 17.745384216308594, 19.45578384399414, 21.166183471679688, 22.876585006713867, 24.586986541748047, 26.297386169433594, 28.007787704467773, 29.71818733215332, 31.4285888671875, 33.13898849487305, 34.849388122558594, 36.559791564941406, 38.27019119262695, 39.980594635009766, 41.69099426269531, 43.40139389038086, 45.111793518066406, 46.82219696044922, 48.532596588134766, 50.24299621582031]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 8.0, 6.0, 5.0, 13.0, 13.0, 19.0, 21.0, 32.0, 28.0, 30.0, 30.0, 38.0, 35.0, 46.0, 37.0, 38.0, 50.0, 43.0, 47.0, 40.0, 43.0, 40.0, 42.0, 38.0, 28.0, 34.0, 27.0, 22.0, 22.0, 33.0, 14.0, 10.0, 14.0, 9.0, 4.0, 6.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6092529296875, -8.312255859375, -8.0152587890625, -7.71826171875, -7.4212646484375, -7.124267578125, -6.8272705078125, -6.5302734375, -6.2332763671875, -5.936279296875, -5.6392822265625, -5.34228515625, -5.0452880859375, -4.748291015625, -4.4512939453125, -4.154296875, -3.8572998046875, -3.560302734375, -3.2633056640625, -2.96630859375, -2.6693115234375, -2.372314453125, -2.0753173828125, -1.7783203125, -1.4813232421875, -1.184326171875, -0.8873291015625, -0.59033203125, -0.2933349609375, 0.003662109375, 0.3006591796875, 0.59765625, 0.8946533203125, 1.191650390625, 1.4886474609375, 1.78564453125, 2.0826416015625, 2.379638671875, 2.6766357421875, 2.9736328125, 3.2706298828125, 3.567626953125, 3.8646240234375, 4.16162109375, 4.4586181640625, 4.755615234375, 5.0526123046875, 5.349609375, 5.6466064453125, 5.943603515625, 6.2406005859375, 6.53759765625, 6.8345947265625, 7.131591796875, 7.4285888671875, 7.7255859375, 8.0225830078125, 8.319580078125, 8.6165771484375, 8.91357421875, 9.2105712890625, 9.507568359375, 9.8045654296875, 10.1015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 18.0, 21.0, 23.0, 34.0, 35.0, 45.0, 73.0, 86.0, 114.0, 167.0, 271.0, 416.0, 731.0, 1479.0, 3544.0, 9594.0, 43353.0, 379417.0, 2308499.0, 1278850.0, 136095.0, 20314.0, 5980.0, 2284.0, 1134.0, 566.0, 320.0, 221.0, 135.0, 111.0, 76.0, 57.0, 49.0, 33.0, 26.0, 18.0, 19.0, 10.0, 10.0, 8.0, 3.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-17.96875, -17.420654296875, -16.87255859375, -16.324462890625, -15.7763671875, -15.228271484375, -14.68017578125, -14.132080078125, -13.583984375, -13.035888671875, -12.48779296875, -11.939697265625, -11.3916015625, -10.843505859375, -10.29541015625, -9.747314453125, -9.19921875, -8.651123046875, -8.10302734375, -7.554931640625, -7.0068359375, -6.458740234375, -5.91064453125, -5.362548828125, -4.814453125, -4.266357421875, -3.71826171875, -3.170166015625, -2.6220703125, -2.073974609375, -1.52587890625, -0.977783203125, -0.4296875, 0.118408203125, 0.66650390625, 1.214599609375, 1.7626953125, 2.310791015625, 2.85888671875, 3.406982421875, 3.955078125, 4.503173828125, 5.05126953125, 5.599365234375, 6.1474609375, 6.695556640625, 7.24365234375, 7.791748046875, 8.33984375, 8.887939453125, 9.43603515625, 9.984130859375, 10.5322265625, 11.080322265625, 11.62841796875, 12.176513671875, 12.724609375, 13.272705078125, 13.82080078125, 14.368896484375, 14.9169921875, 15.465087890625, 16.01318359375, 16.561279296875, 17.109375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 13.0, 23.0, 33.0, 38.0, 66.0, 97.0, 134.0, 191.0, 237.0, 504.0, 648.0, 675.0, 433.0, 292.0, 190.0, 141.0, 105.0, 64.0, 48.0, 35.0, 23.0, 20.0, 22.0, 10.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-24.03125, -23.4305419921875, -22.829833984375, -22.2291259765625, -21.62841796875, -21.0277099609375, -20.427001953125, -19.8262939453125, -19.2255859375, -18.6248779296875, -18.024169921875, -17.4234619140625, -16.82275390625, -16.2220458984375, -15.621337890625, -15.0206298828125, -14.419921875, -13.8192138671875, -13.218505859375, -12.6177978515625, -12.01708984375, -11.4163818359375, -10.815673828125, -10.2149658203125, -9.6142578125, -9.0135498046875, -8.412841796875, -7.8121337890625, -7.21142578125, -6.6107177734375, -6.010009765625, -5.4093017578125, -4.80859375, -4.2078857421875, -3.607177734375, -3.0064697265625, -2.40576171875, -1.8050537109375, -1.204345703125, -0.6036376953125, -0.0029296875, 0.5977783203125, 1.198486328125, 1.7991943359375, 2.39990234375, 3.0006103515625, 3.601318359375, 4.2020263671875, 4.802734375, 5.4034423828125, 6.004150390625, 6.6048583984375, 7.20556640625, 7.8062744140625, 8.406982421875, 9.0076904296875, 9.6083984375, 10.2091064453125, 10.809814453125, 11.4105224609375, 12.01123046875, 12.6119384765625, 13.212646484375, 13.8133544921875, 14.4140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 8.0, 13.0, 17.0, 40.0, 69.0, 100.0, 177.0, 423.0, 799.0, 2374.0, 15468.0, 619857.0, 3490822.0, 57609.0, 4299.0, 1219.0, 461.0, 225.0, 130.0, 67.0, 45.0, 23.0, 7.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -42.00830078125, -40.7041015625, -39.39990234375, -38.095703125, -36.79150390625, -35.4873046875, -34.18310546875, -32.87890625, -31.57470703125, -30.2705078125, -28.96630859375, -27.662109375, -26.35791015625, -25.0537109375, -23.74951171875, -22.4453125, -21.14111328125, -19.8369140625, -18.53271484375, -17.228515625, -15.92431640625, -14.6201171875, -13.31591796875, -12.01171875, -10.70751953125, -9.4033203125, -8.09912109375, -6.794921875, -5.49072265625, -4.1865234375, -2.88232421875, -1.578125, -0.27392578125, 1.0302734375, 2.33447265625, 3.638671875, 4.94287109375, 6.2470703125, 7.55126953125, 8.85546875, 10.15966796875, 11.4638671875, 12.76806640625, 14.072265625, 15.37646484375, 16.6806640625, 17.98486328125, 19.2890625, 20.59326171875, 21.8974609375, 23.20166015625, 24.505859375, 25.81005859375, 27.1142578125, 28.41845703125, 29.72265625, 31.02685546875, 32.3310546875, 33.63525390625, 34.939453125, 36.24365234375, 37.5478515625, 38.85205078125, 40.15625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 70.0, 849.0, 93.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-848.4249267578125, -831.959228515625, -815.4935302734375, -799.02783203125, -782.5621337890625, -766.096435546875, -749.6307373046875, -733.1650390625, -716.6993408203125, -700.233642578125, -683.7679443359375, -667.30224609375, -650.8365478515625, -634.370849609375, -617.9051513671875, -601.439453125, -584.9736938476562, -568.5079956054688, -552.0422973632812, -535.5765991210938, -519.1109008789062, -502.64520263671875, -486.1794738769531, -469.7137756347656, -453.2480773925781, -436.7823791503906, -420.3166809082031, -403.8509826660156, -387.38525390625, -370.9195556640625, -354.453857421875, -337.9881591796875, -321.5224609375, -305.0567626953125, -288.591064453125, -272.1253662109375, -255.65965270996094, -239.19395446777344, -222.72824096679688, -206.26254272460938, -189.79684448242188, -173.33114624023438, -156.86544799804688, -140.3997344970703, -123.93403625488281, -107.46833801269531, -91.00263214111328, -74.53692626953125, -58.07122802734375, -41.605525970458984, -25.13982391357422, -8.674121856689453, 7.7915802001953125, 24.257278442382812, 40.722984313964844, 57.188690185546875, 73.65438842773438, 90.12008666992188, 106.5857925415039, 123.05149841308594, 139.51719665527344, 155.98289489746094, 172.4486083984375, 188.914306640625, 205.3800048828125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 3.0, 5.0, 13.0, 16.0, 18.0, 16.0, 18.0, 28.0, 23.0, 28.0, 38.0, 39.0, 37.0, 37.0, 37.0, 40.0, 39.0, 47.0, 52.0, 46.0, 37.0, 32.0, 46.0, 38.0, 39.0, 37.0, 24.0, 25.0, 23.0, 21.0, 16.0, 20.0, 7.0, 7.0, 12.0, 9.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-54.67823028564453, -52.84877395629883, -51.01932144165039, -49.18986511230469, -47.360408782958984, -45.53095626831055, -43.701499938964844, -41.872047424316406, -40.0425910949707, -38.213134765625, -36.38368225097656, -34.55422592163086, -32.724769592285156, -30.89531707763672, -29.065860748291016, -27.236406326293945, -25.406949996948242, -23.577495574951172, -21.74803924560547, -19.9185848236084, -18.089130401611328, -16.259674072265625, -14.430219650268555, -12.600765228271484, -10.771309852600098, -8.941854476928711, -7.112400054931641, -5.282944679260254, -3.4534897804260254, -1.6240348815917969, 0.20542049407958984, 2.03487491607666, 3.864330291748047, 5.693785190582275, 7.523240089416504, 9.35269546508789, 11.182149887084961, 13.011605262756348, 14.841060638427734, 16.670515060424805, 18.499969482421875, 20.329423904418945, 22.15888023376465, 23.98833465576172, 25.81778907775879, 27.64724349975586, 29.476699829101562, 31.306154251098633, 33.13561248779297, 34.96506881713867, 36.79452133178711, 38.62397766113281, 40.453433990478516, 42.28288650512695, 44.112342834472656, 45.941795349121094, 47.7712516784668, 49.6007080078125, 51.43016052246094, 53.25961685180664, 55.089073181152344, 56.91852569580078, 58.747982025146484, 60.57743835449219, 62.406890869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 15.0, 24.0, 15.0, 21.0, 32.0, 26.0, 40.0, 36.0, 43.0, 28.0, 43.0, 41.0, 33.0, 41.0, 31.0, 45.0, 53.0, 46.0, 33.0, 43.0, 41.0, 24.0, 37.0, 40.0, 22.0, 17.0, 14.0, 12.0, 13.0, 11.0, 11.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.3929443359375, -6.160888671875, -5.9288330078125, -5.69677734375, -5.4647216796875, -5.232666015625, -5.0006103515625, -4.7685546875, -4.5364990234375, -4.304443359375, -4.0723876953125, -3.84033203125, -3.6082763671875, -3.376220703125, -3.1441650390625, -2.912109375, -2.6800537109375, -2.447998046875, -2.2159423828125, -1.98388671875, -1.7518310546875, -1.519775390625, -1.2877197265625, -1.0556640625, -0.8236083984375, -0.591552734375, -0.3594970703125, -0.12744140625, 0.1046142578125, 0.336669921875, 0.5687255859375, 0.80078125, 1.0328369140625, 1.264892578125, 1.4969482421875, 1.72900390625, 1.9610595703125, 2.193115234375, 2.4251708984375, 2.6572265625, 2.8892822265625, 3.121337890625, 3.3533935546875, 3.58544921875, 3.8175048828125, 4.049560546875, 4.2816162109375, 4.513671875, 4.7457275390625, 4.977783203125, 5.2098388671875, 5.44189453125, 5.6739501953125, 5.906005859375, 6.1380615234375, 6.3701171875, 6.6021728515625, 6.834228515625, 7.0662841796875, 7.29833984375, 7.5303955078125, 7.762451171875, 7.9945068359375, 8.2265625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 19.0, 29.0, 36.0, 53.0, 76.0, 143.0, 215.0, 320.0, 550.0, 879.0, 1376.0, 2149.0, 3522.0, 5771.0, 9553.0, 15674.0, 26178.0, 44056.0, 74336.0, 122980.0, 186681.0, 199791.0, 140671.0, 86098.0, 50774.0, 30443.0, 17992.0, 10947.0, 6560.0, 4122.0, 2444.0, 1525.0, 984.0, 573.0, 333.0, 249.0, 143.0, 108.0, 63.0, 43.0, 28.0, 19.0, 13.0, 11.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7138900756835938, -0.6909637451171875, -0.6680374145507812, -0.645111083984375, -0.6221847534179688, -0.5992584228515625, -0.5763320922851562, -0.55340576171875, -0.5304794311523438, -0.5075531005859375, -0.48462677001953125, -0.461700439453125, -0.43877410888671875, -0.4158477783203125, -0.39292144775390625, -0.3699951171875, -0.34706878662109375, -0.3241424560546875, -0.30121612548828125, -0.278289794921875, -0.25536346435546875, -0.2324371337890625, -0.20951080322265625, -0.18658447265625, -0.16365814208984375, -0.1407318115234375, -0.11780548095703125, -0.094879150390625, -0.07195281982421875, -0.0490264892578125, -0.02610015869140625, -0.003173828125, 0.01975250244140625, 0.0426788330078125, 0.06560516357421875, 0.088531494140625, 0.11145782470703125, 0.1343841552734375, 0.15731048583984375, 0.18023681640625, 0.20316314697265625, 0.2260894775390625, 0.24901580810546875, 0.271942138671875, 0.29486846923828125, 0.3177947998046875, 0.34072113037109375, 0.3636474609375, 0.38657379150390625, 0.4095001220703125, 0.43242645263671875, 0.455352783203125, 0.47827911376953125, 0.5012054443359375, 0.5241317749023438, 0.54705810546875, 0.5699844360351562, 0.5929107666015625, 0.6158370971679688, 0.638763427734375, 0.6616897583007812, 0.6846160888671875, 0.7075424194335938, 0.73046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 5.0, 0.0, 6.0, 7.0, 9.0, 13.0, 13.0, 13.0, 19.0, 29.0, 23.0, 30.0, 27.0, 27.0, 31.0, 38.0, 23.0, 36.0, 47.0, 43.0, 44.0, 1066.0, 40.0, 36.0, 44.0, 30.0, 45.0, 27.0, 37.0, 26.0, 30.0, 16.0, 23.0, 24.0, 19.0, 15.0, 10.0, 17.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9837646484375, -3.842529296875, -3.7012939453125, -3.56005859375, -3.4188232421875, -3.277587890625, -3.1363525390625, -2.9951171875, -2.8538818359375, -2.712646484375, -2.5714111328125, -2.43017578125, -2.2889404296875, -2.147705078125, -2.0064697265625, -1.865234375, -1.7239990234375, -1.582763671875, -1.4415283203125, -1.30029296875, -1.1590576171875, -1.017822265625, -0.8765869140625, -0.7353515625, -0.5941162109375, -0.452880859375, -0.3116455078125, -0.17041015625, -0.0291748046875, 0.112060546875, 0.2532958984375, 0.39453125, 0.5357666015625, 0.677001953125, 0.8182373046875, 0.95947265625, 1.1007080078125, 1.241943359375, 1.3831787109375, 1.5244140625, 1.6656494140625, 1.806884765625, 1.9481201171875, 2.08935546875, 2.2305908203125, 2.371826171875, 2.5130615234375, 2.654296875, 2.7955322265625, 2.936767578125, 3.0780029296875, 3.21923828125, 3.3604736328125, 3.501708984375, 3.6429443359375, 3.7841796875, 3.9254150390625, 4.066650390625, 4.2078857421875, 4.34912109375, 4.4903564453125, 4.631591796875, 4.7728271484375, 4.9140625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 20.0, 15.0, 27.0, 38.0, 97.0, 124.0, 206.0, 362.0, 588.0, 976.0, 1532.0, 2561.0, 4113.0, 6887.0, 11023.0, 17610.0, 28208.0, 44353.0, 70664.0, 105537.0, 146669.0, 1215288.0, 146113.0, 105757.0, 69751.0, 45004.0, 27754.0, 17322.0, 11172.0, 6693.0, 4189.0, 2581.0, 1546.0, 913.0, 575.0, 351.0, 192.0, 118.0, 68.0, 41.0, 28.0, 27.0, 17.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.59619140625, -0.5793952941894531, -0.5625991821289062, -0.5458030700683594, -0.5290069580078125, -0.5122108459472656, -0.49541473388671875, -0.4786186218261719, -0.461822509765625, -0.4450263977050781, -0.42823028564453125, -0.4114341735839844, -0.3946380615234375, -0.3778419494628906, -0.36104583740234375, -0.3442497253417969, -0.32745361328125, -0.3106575012207031, -0.29386138916015625, -0.2770652770996094, -0.2602691650390625, -0.24347305297851562, -0.22667694091796875, -0.20988082885742188, -0.193084716796875, -0.17628860473632812, -0.15949249267578125, -0.14269638061523438, -0.1259002685546875, -0.10910415649414062, -0.09230804443359375, -0.07551193237304688, -0.0587158203125, -0.041919708251953125, -0.02512359619140625, -0.008327484130859375, 0.0084686279296875, 0.025264739990234375, 0.04206085205078125, 0.058856964111328125, 0.075653076171875, 0.09244918823242188, 0.10924530029296875, 0.12604141235351562, 0.1428375244140625, 0.15963363647460938, 0.17642974853515625, 0.19322586059570312, 0.21002197265625, 0.22681808471679688, 0.24361419677734375, 0.2604103088378906, 0.2772064208984375, 0.2940025329589844, 0.31079864501953125, 0.3275947570800781, 0.344390869140625, 0.3611869812011719, 0.37798309326171875, 0.3947792053222656, 0.4115753173828125, 0.4283714294433594, 0.44516754150390625, 0.4619636535644531, 0.478759765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 8.0, 8.0, 9.0, 17.0, 16.0, 20.0, 26.0, 24.0, 22.0, 36.0, 36.0, 39.0, 58.0, 44.0, 46.0, 50.0, 39.0, 36.0, 50.0, 43.0, 46.0, 47.0, 33.0, 39.0, 34.0, 30.0, 22.0, 20.0, 15.0, 14.0, 17.0, 14.0, 10.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002166748046875, -0.0020940005779266357, -0.0020212531089782715, -0.0019485056400299072, -0.001875758171081543, -0.0018030107021331787, -0.0017302632331848145, -0.0016575157642364502, -0.001584768295288086, -0.0015120208263397217, -0.0014392733573913574, -0.0013665258884429932, -0.001293778419494629, -0.0012210309505462646, -0.0011482834815979004, -0.0010755360126495361, -0.0010027885437011719, -0.0009300410747528076, -0.0008572936058044434, -0.0007845461368560791, -0.0007117986679077148, -0.0006390511989593506, -0.0005663037300109863, -0.0004935562610626221, -0.0004208087921142578, -0.00034806132316589355, -0.0002753138542175293, -0.00020256638526916504, -0.00012981891632080078, -5.7071447372436523e-05, 1.5676021575927734e-05, 8.842349052429199e-05, 0.00016117095947265625, 0.0002339184284210205, 0.00030666589736938477, 0.000379413366317749, 0.0004521608352661133, 0.0005249083042144775, 0.0005976557731628418, 0.0006704032421112061, 0.0007431507110595703, 0.0008158981800079346, 0.0008886456489562988, 0.0009613931179046631, 0.0010341405868530273, 0.0011068880558013916, 0.0011796355247497559, 0.0012523829936981201, 0.0013251304626464844, 0.0013978779315948486, 0.0014706254005432129, 0.0015433728694915771, 0.0016161203384399414, 0.0016888678073883057, 0.00176161527633667, 0.0018343627452850342, 0.0019071102142333984, 0.0019798576831817627, 0.002052605152130127, 0.002125352621078491, 0.0021981000900268555, 0.0022708475589752197, 0.002343595027923584, 0.0024163424968719482, 0.0024890899658203125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 20.0, 19.0, 26.0, 26.0, 44.0, 40.0, 67.0, 73.0, 117.0, 158.0, 236.0, 308.0, 559.0, 1183.0, 60846.0, 975846.0, 6702.0, 783.0, 492.0, 289.0, 176.0, 137.0, 89.0, 74.0, 53.0, 50.0, 28.0, 28.0, 12.0, 15.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.06341552734375, -0.06175994873046875, -0.0601043701171875, -0.05844879150390625, -0.056793212890625, -0.05513763427734375, -0.0534820556640625, -0.05182647705078125, -0.0501708984375, -0.04851531982421875, -0.0468597412109375, -0.04520416259765625, -0.043548583984375, -0.04189300537109375, -0.0402374267578125, -0.03858184814453125, -0.03692626953125, -0.03527069091796875, -0.0336151123046875, -0.03195953369140625, -0.030303955078125, -0.02864837646484375, -0.0269927978515625, -0.02533721923828125, -0.023681640625, -0.02202606201171875, -0.0203704833984375, -0.01871490478515625, -0.017059326171875, -0.01540374755859375, -0.0137481689453125, -0.01209259033203125, -0.01043701171875, -0.00878143310546875, -0.0071258544921875, -0.00547027587890625, -0.003814697265625, -0.00215911865234375, -0.0005035400390625, 0.00115203857421875, 0.0028076171875, 0.00446319580078125, 0.0061187744140625, 0.00777435302734375, 0.009429931640625, 0.01108551025390625, 0.0127410888671875, 0.01439666748046875, 0.01605224609375, 0.01770782470703125, 0.0193634033203125, 0.02101898193359375, 0.022674560546875, 0.02433013916015625, 0.0259857177734375, 0.02764129638671875, 0.029296875, 0.03095245361328125, 0.0326080322265625, 0.03426361083984375, 0.035919189453125, 0.03757476806640625, 0.0392303466796875, 0.04088592529296875, 0.04254150390625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 524.0, 468.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03573993593454361, -0.035077761858701706, -0.0344155915081501, -0.0337534174323082, -0.03309124708175659, -0.03242907300591469, -0.03176690265536308, -0.03110472857952118, -0.030442556366324425, -0.02978038415312767, -0.029118211939930916, -0.02845603972673416, -0.027793865650892258, -0.027131693437695503, -0.02646952122449875, -0.025807349011301994, -0.02514517679810524, -0.024483004584908485, -0.02382083237171173, -0.023158660158514977, -0.022496487945318222, -0.02183431386947632, -0.021172141656279564, -0.02050996944308281, -0.019847797229886055, -0.0191856250166893, -0.018523452803492546, -0.01786128059029579, -0.017199106514453888, -0.016536934301257133, -0.01587476208806038, -0.015212589874863625, -0.01455041766166687, -0.013888245448470116, -0.013226073235273361, -0.012563900090754032, -0.011901727877557278, -0.011239555664360523, -0.010577382519841194, -0.00991521030664444, -0.009253038093447685, -0.00859086588025093, -0.007928693667054176, -0.007266520522534847, -0.006604348309338093, -0.005942176096141338, -0.005280003417283297, -0.004617830738425255, -0.0039556585252285, -0.0032934860792011023, -0.002631313633173704, -0.001969141187146306, -0.001306968741118908, -0.0006447962950915098, 1.737615093588829e-05, 0.00067954882979393, 0.0013417210429906845, 0.0020038934890180826, 0.0026660659350454807, 0.003328238381072879, 0.003990410827100277, 0.004652583040297031, 0.005314755719155073, 0.005976928398013115, 0.006639100611209869]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 6.0, 16.0, 11.0, 16.0, 20.0, 24.0, 32.0, 26.0, 34.0, 37.0, 40.0, 43.0, 44.0, 39.0, 45.0, 44.0, 57.0, 27.0, 49.0, 51.0, 40.0, 32.0, 36.0, 26.0, 39.0, 29.0, 24.0, 17.0, 15.0, 11.0, 12.0, 15.0, 9.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015895962715148926, -0.001541762612760067, -0.0014939289540052414, -0.0014460952952504158, -0.0013982616364955902, -0.0013504279777407646, -0.001302594318985939, -0.0012547606602311134, -0.0012069270014762878, -0.0011590933427214622, -0.0011112596839666367, -0.001063426025211811, -0.0010155923664569855, -0.0009677587077021599, -0.0009199250489473343, -0.0008720913901925087, -0.0008242577314376831, -0.0007764240726828575, -0.0007285904139280319, -0.0006807567551732063, -0.0006329230964183807, -0.0005850894376635551, -0.0005372557789087296, -0.000489422120153904, -0.00044158846139907837, -0.0003937548026442528, -0.0003459211438894272, -0.0002980874851346016, -0.000250253826379776, -0.0002024201676249504, -0.00015458650887012482, -0.00010675285011529922, -5.891919136047363e-05, -1.108553260564804e-05, 3.674812614917755e-05, 8.458178490400314e-05, 0.00013241544365882874, 0.00018024910241365433, 0.00022808276116847992, 0.0002759164199233055, 0.0003237500786781311, 0.0003715837374329567, 0.0004194173961877823, 0.0004672510549426079, 0.0005150847136974335, 0.0005629183724522591, 0.0006107520312070847, 0.0006585856899619102, 0.0007064193487167358, 0.0007542530074715614, 0.000802086666226387, 0.0008499203249812126, 0.0008977539837360382, 0.0009455876424908638, 0.0009934213012456894, 0.001041254960000515, 0.0010890886187553406, 0.0011369222775101662, 0.0011847559362649918, 0.0012325895950198174, 0.001280423253774643, 0.0013282569125294685, 0.0013760905712842941, 0.0014239242300391197, 0.0014717578887939453]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 10.0, 15.0, 25.0, 15.0, 20.0, 32.0, 26.0, 40.0, 38.0, 41.0, 30.0, 42.0, 41.0, 33.0, 41.0, 30.0, 45.0, 53.0, 46.0, 35.0, 42.0, 41.0, 23.0, 38.0, 39.0, 22.0, 17.0, 14.0, 12.0, 13.0, 12.0, 10.0, 11.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.38909912109375, -6.1571044921875, -5.92510986328125, -5.693115234375, -5.46112060546875, -5.2291259765625, -4.99713134765625, -4.76513671875, -4.53314208984375, -4.3011474609375, -4.06915283203125, -3.837158203125, -3.60516357421875, -3.3731689453125, -3.14117431640625, -2.9091796875, -2.67718505859375, -2.4451904296875, -2.21319580078125, -1.981201171875, -1.74920654296875, -1.5172119140625, -1.28521728515625, -1.05322265625, -0.82122802734375, -0.5892333984375, -0.35723876953125, -0.125244140625, 0.10675048828125, 0.3387451171875, 0.57073974609375, 0.802734375, 1.03472900390625, 1.2667236328125, 1.49871826171875, 1.730712890625, 1.96270751953125, 2.1947021484375, 2.42669677734375, 2.65869140625, 2.89068603515625, 3.1226806640625, 3.35467529296875, 3.586669921875, 3.81866455078125, 4.0506591796875, 4.28265380859375, 4.5146484375, 4.74664306640625, 4.9786376953125, 5.21063232421875, 5.442626953125, 5.67462158203125, 5.9066162109375, 6.13861083984375, 6.37060546875, 6.60260009765625, 6.8345947265625, 7.06658935546875, 7.298583984375, 7.53057861328125, 7.7625732421875, 7.99456787109375, 8.2265625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 13.0, 9.0, 21.0, 21.0, 39.0, 40.0, 46.0, 70.0, 117.0, 148.0, 238.0, 379.0, 467.0, 710.0, 1119.0, 1819.0, 3093.0, 6273.0, 18845.0, 153711.0, 733705.0, 99624.0, 15065.0, 5263.0, 2838.0, 1631.0, 1017.0, 646.0, 532.0, 312.0, 218.0, 154.0, 98.0, 59.0, 69.0, 39.0, 33.0, 26.0, 10.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-21.390625, -20.78662109375, -20.1826171875, -19.57861328125, -18.974609375, -18.37060546875, -17.7666015625, -17.16259765625, -16.55859375, -15.95458984375, -15.3505859375, -14.74658203125, -14.142578125, -13.53857421875, -12.9345703125, -12.33056640625, -11.7265625, -11.12255859375, -10.5185546875, -9.91455078125, -9.310546875, -8.70654296875, -8.1025390625, -7.49853515625, -6.89453125, -6.29052734375, -5.6865234375, -5.08251953125, -4.478515625, -3.87451171875, -3.2705078125, -2.66650390625, -2.0625, -1.45849609375, -0.8544921875, -0.25048828125, 0.353515625, 0.95751953125, 1.5615234375, 2.16552734375, 2.76953125, 3.37353515625, 3.9775390625, 4.58154296875, 5.185546875, 5.78955078125, 6.3935546875, 6.99755859375, 7.6015625, 8.20556640625, 8.8095703125, 9.41357421875, 10.017578125, 10.62158203125, 11.2255859375, 11.82958984375, 12.43359375, 13.03759765625, 13.6416015625, 14.24560546875, 14.849609375, 15.45361328125, 16.0576171875, 16.66162109375, 17.265625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 4.0, 5.0, 15.0, 9.0, 15.0, 12.0, 21.0, 21.0, 18.0, 22.0, 35.0, 30.0, 37.0, 46.0, 65.0, 77.0, 123.0, 358.0, 1522.0, 186.0, 67.0, 45.0, 49.0, 32.0, 35.0, 30.0, 25.0, 22.0, 15.0, 13.0, 13.0, 13.0, 7.0, 10.0, 9.0, 2.0, 7.0, 6.0, 2.0, 2.0, 9.0, 2.0, 2.0, 2.0], "bins": [-21.671875, -21.1038818359375, -20.535888671875, -19.9678955078125, -19.39990234375, -18.8319091796875, -18.263916015625, -17.6959228515625, -17.1279296875, -16.5599365234375, -15.991943359375, -15.4239501953125, -14.85595703125, -14.2879638671875, -13.719970703125, -13.1519775390625, -12.583984375, -12.0159912109375, -11.447998046875, -10.8800048828125, -10.31201171875, -9.7440185546875, -9.176025390625, -8.6080322265625, -8.0400390625, -7.4720458984375, -6.904052734375, -6.3360595703125, -5.76806640625, -5.2000732421875, -4.632080078125, -4.0640869140625, -3.49609375, -2.9281005859375, -2.360107421875, -1.7921142578125, -1.22412109375, -0.6561279296875, -0.088134765625, 0.4798583984375, 1.0478515625, 1.6158447265625, 2.183837890625, 2.7518310546875, 3.31982421875, 3.8878173828125, 4.455810546875, 5.0238037109375, 5.591796875, 6.1597900390625, 6.727783203125, 7.2957763671875, 7.86376953125, 8.4317626953125, 8.999755859375, 9.5677490234375, 10.1357421875, 10.7037353515625, 11.271728515625, 11.8397216796875, 12.40771484375, 12.9757080078125, 13.543701171875, 14.1116943359375, 14.6796875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 29.0, 37.0, 42.0, 59.0, 86.0, 138.0, 227.0, 448.0, 1158.0, 21152.0, 3116365.0, 4051.0, 794.0, 375.0, 221.0, 135.0, 93.0, 77.0, 44.0, 29.0, 14.0, 13.0, 15.0, 12.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.8125, -76.58203125, -74.3515625, -72.12109375, -69.890625, -67.66015625, -65.4296875, -63.19921875, -60.96875, -58.73828125, -56.5078125, -54.27734375, -52.046875, -49.81640625, -47.5859375, -45.35546875, -43.125, -40.89453125, -38.6640625, -36.43359375, -34.203125, -31.97265625, -29.7421875, -27.51171875, -25.28125, -23.05078125, -20.8203125, -18.58984375, -16.359375, -14.12890625, -11.8984375, -9.66796875, -7.4375, -5.20703125, -2.9765625, -0.74609375, 1.484375, 3.71484375, 5.9453125, 8.17578125, 10.40625, 12.63671875, 14.8671875, 17.09765625, 19.328125, 21.55859375, 23.7890625, 26.01953125, 28.25, 30.48046875, 32.7109375, 34.94140625, 37.171875, 39.40234375, 41.6328125, 43.86328125, 46.09375, 48.32421875, 50.5546875, 52.78515625, 55.015625, 57.24609375, 59.4765625, 61.70703125, 63.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 88.0, 374.0, 434.0, 97.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.78763580322266, -111.15155792236328, -106.51548767089844, -101.87940979003906, -97.24333190917969, -92.60725402832031, -87.97117614746094, -83.3351058959961, -78.69902801513672, -74.06295013427734, -69.4268798828125, -64.79080200195312, -60.15472412109375, -55.518646240234375, -50.882572174072266, -46.246498107910156, -41.61042022705078, -36.974342346191406, -32.3382682800293, -27.702192306518555, -23.066116333007812, -18.43004035949707, -13.793964385986328, -9.157890319824219, -4.521812438964844, 0.11426353454589844, 4.750339508056641, 9.386415481567383, 14.022491455078125, 18.658567428588867, 23.29464340209961, 27.93071746826172, 32.56678771972656, 37.20286560058594, 41.83893966674805, 46.475013732910156, 51.11109161376953, 55.747169494628906, 60.383243560791016, 65.01931762695312, 69.6553955078125, 74.29147338867188, 78.92755126953125, 83.5636215209961, 88.19969940185547, 92.83577728271484, 97.47184753417969, 102.10792541503906, 106.74400329589844, 111.38008117675781, 116.01615905761719, 120.65222930908203, 125.2883071899414, 129.92437744140625, 134.56045532226562, 139.196533203125, 143.83261108398438, 148.46868896484375, 153.10476684570312, 157.7408447265625, 162.37692260742188, 167.0129852294922, 171.64906311035156, 176.28514099121094, 180.9212188720703]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 9.0, 6.0, 6.0, 12.0, 14.0, 14.0, 16.0, 20.0, 22.0, 24.0, 26.0, 23.0, 41.0, 29.0, 26.0, 34.0, 24.0, 28.0, 43.0, 40.0, 43.0, 41.0, 32.0, 32.0, 40.0, 36.0, 37.0, 21.0, 29.0, 27.0, 16.0, 28.0, 20.0, 24.0, 20.0, 17.0, 7.0, 13.0, 4.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0], "bins": [-44.91546630859375, -43.57817840576172, -42.24089050292969, -40.903602600097656, -39.56631088256836, -38.22902297973633, -36.8917350769043, -35.554447174072266, -34.217159271240234, -32.8798713684082, -31.54258155822754, -30.205293655395508, -28.868005752563477, -27.530715942382812, -26.19342803955078, -24.85614013671875, -23.518850326538086, -22.181562423706055, -20.84427261352539, -19.50698471069336, -18.169696807861328, -16.832408905029297, -15.495119094848633, -14.157831192016602, -12.820542335510254, -11.483253479003906, -10.145965576171875, -8.808676719665527, -7.471388339996338, -6.134099960327148, -4.796811103820801, -3.4595232009887695, -2.122234344482422, -0.7849458456039429, 0.5523426532745361, 1.8896312713623047, 3.226919651031494, 4.564208030700684, 5.901496887207031, 7.2387847900390625, 8.57607364654541, 9.913362503051758, 11.250650405883789, 12.587939262390137, 13.925228118896484, 15.262516021728516, 16.599803924560547, 17.937091827392578, 19.274381637573242, 20.611669540405273, 21.948959350585938, 23.28624725341797, 24.62353515625, 25.96082305908203, 27.298112869262695, 28.635400772094727, 29.97269058227539, 31.309978485107422, 32.64726638793945, 33.98455810546875, 35.32184600830078, 36.65913391113281, 37.996421813964844, 39.333709716796875, 40.670997619628906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 8.0, 4.0, 8.0, 10.0, 13.0, 9.0, 12.0, 27.0, 17.0, 21.0, 20.0, 32.0, 27.0, 37.0, 30.0, 29.0, 23.0, 45.0, 37.0, 50.0, 52.0, 30.0, 44.0, 43.0, 43.0, 29.0, 30.0, 32.0, 24.0, 32.0, 20.0, 24.0, 26.0, 18.0, 14.0, 14.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.58984375, -6.369140625, -6.1484375, -5.927734375, -5.70703125, -5.486328125, -5.265625, -5.044921875, -4.82421875, -4.603515625, -4.3828125, -4.162109375, -3.94140625, -3.720703125, -3.5, -3.279296875, -3.05859375, -2.837890625, -2.6171875, -2.396484375, -2.17578125, -1.955078125, -1.734375, -1.513671875, -1.29296875, -1.072265625, -0.8515625, -0.630859375, -0.41015625, -0.189453125, 0.03125, 0.251953125, 0.47265625, 0.693359375, 0.9140625, 1.134765625, 1.35546875, 1.576171875, 1.796875, 2.017578125, 2.23828125, 2.458984375, 2.6796875, 2.900390625, 3.12109375, 3.341796875, 3.5625, 3.783203125, 4.00390625, 4.224609375, 4.4453125, 4.666015625, 4.88671875, 5.107421875, 5.328125, 5.548828125, 5.76953125, 5.990234375, 6.2109375, 6.431640625, 6.65234375, 6.873046875, 7.09375, 7.314453125, 7.53515625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 18.0, 18.0, 30.0, 26.0, 31.0, 45.0, 71.0, 68.0, 102.0, 126.0, 178.0, 269.0, 333.0, 514.0, 737.0, 1216.0, 2095.0, 4366.0, 11827.0, 69532.0, 790289.0, 2655722.0, 590392.0, 46702.0, 9946.0, 3952.0, 2065.0, 1168.0, 725.0, 462.0, 316.0, 213.0, 172.0, 116.0, 110.0, 79.0, 54.0, 51.0, 25.0, 33.0, 18.0, 15.0, 10.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.2734375, -13.804443359375, -13.33544921875, -12.866455078125, -12.3974609375, -11.928466796875, -11.45947265625, -10.990478515625, -10.521484375, -10.052490234375, -9.58349609375, -9.114501953125, -8.6455078125, -8.176513671875, -7.70751953125, -7.238525390625, -6.76953125, -6.300537109375, -5.83154296875, -5.362548828125, -4.8935546875, -4.424560546875, -3.95556640625, -3.486572265625, -3.017578125, -2.548583984375, -2.07958984375, -1.610595703125, -1.1416015625, -0.672607421875, -0.20361328125, 0.265380859375, 0.734375, 1.203369140625, 1.67236328125, 2.141357421875, 2.6103515625, 3.079345703125, 3.54833984375, 4.017333984375, 4.486328125, 4.955322265625, 5.42431640625, 5.893310546875, 6.3623046875, 6.831298828125, 7.30029296875, 7.769287109375, 8.23828125, 8.707275390625, 9.17626953125, 9.645263671875, 10.1142578125, 10.583251953125, 11.05224609375, 11.521240234375, 11.990234375, 12.459228515625, 12.92822265625, 13.397216796875, 13.8662109375, 14.335205078125, 14.80419921875, 15.273193359375, 15.7421875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 13.0, 19.0, 29.0, 48.0, 79.0, 122.0, 205.0, 314.0, 537.0, 774.0, 718.0, 454.0, 310.0, 184.0, 113.0, 59.0, 32.0, 18.0, 16.0, 8.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3671875, -13.7659912109375, -13.164794921875, -12.5635986328125, -11.96240234375, -11.3612060546875, -10.760009765625, -10.1588134765625, -9.5576171875, -8.9564208984375, -8.355224609375, -7.7540283203125, -7.15283203125, -6.5516357421875, -5.950439453125, -5.3492431640625, -4.748046875, -4.1468505859375, -3.545654296875, -2.9444580078125, -2.34326171875, -1.7420654296875, -1.140869140625, -0.5396728515625, 0.0615234375, 0.6627197265625, 1.263916015625, 1.8651123046875, 2.46630859375, 3.0675048828125, 3.668701171875, 4.2698974609375, 4.87109375, 5.4722900390625, 6.073486328125, 6.6746826171875, 7.27587890625, 7.8770751953125, 8.478271484375, 9.0794677734375, 9.6806640625, 10.2818603515625, 10.883056640625, 11.4842529296875, 12.08544921875, 12.6866455078125, 13.287841796875, 13.8890380859375, 14.490234375, 15.0914306640625, 15.692626953125, 16.2938232421875, 16.89501953125, 17.4962158203125, 18.097412109375, 18.6986083984375, 19.2998046875, 19.9010009765625, 20.502197265625, 21.1033935546875, 21.70458984375, 22.3057861328125, 22.906982421875, 23.5081787109375, 24.109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 15.0, 20.0, 31.0, 37.0, 85.0, 144.0, 321.0, 704.0, 2021.0, 18326.0, 3935917.0, 230169.0, 4321.0, 1166.0, 472.0, 229.0, 123.0, 77.0, 26.0, 24.0, 18.0, 2.0, 7.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-56.5625, -55.173828125, -53.78515625, -52.396484375, -51.0078125, -49.619140625, -48.23046875, -46.841796875, -45.453125, -44.064453125, -42.67578125, -41.287109375, -39.8984375, -38.509765625, -37.12109375, -35.732421875, -34.34375, -32.955078125, -31.56640625, -30.177734375, -28.7890625, -27.400390625, -26.01171875, -24.623046875, -23.234375, -21.845703125, -20.45703125, -19.068359375, -17.6796875, -16.291015625, -14.90234375, -13.513671875, -12.125, -10.736328125, -9.34765625, -7.958984375, -6.5703125, -5.181640625, -3.79296875, -2.404296875, -1.015625, 0.373046875, 1.76171875, 3.150390625, 4.5390625, 5.927734375, 7.31640625, 8.705078125, 10.09375, 11.482421875, 12.87109375, 14.259765625, 15.6484375, 17.037109375, 18.42578125, 19.814453125, 21.203125, 22.591796875, 23.98046875, 25.369140625, 26.7578125, 28.146484375, 29.53515625, 30.923828125, 32.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 25.0, 137.0, 277.0, 355.0, 164.0, 39.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.05208587646484, -66.65472412109375, -62.257362365722656, -57.86000061035156, -53.46263885498047, -49.065277099609375, -44.66791915893555, -40.27055740356445, -35.87319564819336, -31.475833892822266, -27.078472137451172, -22.68111228942871, -18.283750534057617, -13.886388778686523, -9.489028930664062, -5.091667175292969, -0.694305419921875, 3.7030558586120605, 8.100417137145996, 12.497777938842773, 16.895139694213867, 21.29250144958496, 25.689861297607422, 30.087223052978516, 34.48458480834961, 38.8819465637207, 43.2793083190918, 47.676666259765625, 52.07402801513672, 56.47138977050781, 60.868751525878906, 65.26611328125, 69.66348266601562, 74.06084442138672, 78.45820617675781, 82.8555679321289, 87.2529296875, 91.6502914428711, 96.04765319824219, 100.44500732421875, 104.84237670898438, 109.23973846435547, 113.63710021972656, 118.03446197509766, 122.43182373046875, 126.82918548583984, 131.22654724121094, 135.6239013671875, 140.02127075195312, 144.4186248779297, 148.8159942626953, 153.21334838867188, 157.6107177734375, 162.00807189941406, 166.4054412841797, 170.80279541015625, 175.2001495361328, 179.59750366210938, 183.994873046875, 188.39222717285156, 192.7895965576172, 197.18695068359375, 201.58432006835938, 205.98167419433594, 210.37904357910156]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 5.0, 5.0, 14.0, 15.0, 11.0, 12.0, 20.0, 22.0, 29.0, 25.0, 22.0, 29.0, 33.0, 36.0, 24.0, 30.0, 44.0, 40.0, 42.0, 46.0, 47.0, 32.0, 42.0, 38.0, 29.0, 35.0, 32.0, 24.0, 28.0, 18.0, 18.0, 27.0, 13.0, 21.0, 13.0, 11.0, 12.0, 14.0, 4.0, 4.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-42.887542724609375, -41.56871795654297, -40.24989318847656, -38.93106460571289, -37.612239837646484, -36.29341506958008, -34.97459030151367, -33.655765533447266, -32.336936950683594, -31.018112182617188, -29.69928550720215, -28.380460739135742, -27.061634063720703, -25.742809295654297, -24.42398452758789, -23.105159759521484, -21.786334991455078, -20.467510223388672, -19.148683547973633, -17.829858779907227, -16.511032104492188, -15.192207336425781, -13.873382568359375, -12.554556846618652, -11.23573112487793, -9.916905403137207, -8.598079681396484, -7.279254913330078, -5.9604291915893555, -4.641603469848633, -3.3227782249450684, -2.003952980041504, -0.6851272583007812, 0.6336982250213623, 1.9525237083435059, 3.2713491916656494, 4.590174674987793, 5.909000396728516, 7.22782564163208, 8.546650886535645, 9.865476608276367, 11.18430233001709, 12.503128051757812, 13.821952819824219, 15.140778541564941, 16.459604263305664, 17.77842903137207, 19.09725570678711, 20.416080474853516, 21.734905242919922, 23.05373191833496, 24.372556686401367, 25.691383361816406, 27.010208129882812, 28.32903289794922, 29.647857666015625, 30.966684341430664, 32.2855110168457, 33.60433578491211, 34.923160552978516, 36.24198532104492, 37.560813903808594, 38.879638671875, 40.198463439941406, 41.51728820800781]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 38.0, 37.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 26.0, 18.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 11.0, 23.0, 39.0, 60.0, 87.0, 128.0, 216.0, 280.0, 388.0, 570.0, 807.0, 1218.0, 1748.0, 2287.0, 3431.0, 5201.0, 7592.0, 11584.0, 17279.0, 26939.0, 42103.0, 63906.0, 96468.0, 136084.0, 163773.0, 146855.0, 108526.0, 72287.0, 47569.0, 30928.0, 19825.0, 13106.0, 8751.0, 5846.0, 3980.0, 2644.0, 1849.0, 1323.0, 829.0, 641.0, 433.0, 307.0, 215.0, 134.0, 104.0, 68.0, 32.0, 28.0, 15.0, 10.0, 9.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.446533203125, -0.4319648742675781, -0.41739654541015625, -0.4028282165527344, -0.3882598876953125, -0.3736915588378906, -0.35912322998046875, -0.3445549011230469, -0.329986572265625, -0.3154182434082031, -0.30084991455078125, -0.2862815856933594, -0.2717132568359375, -0.2571449279785156, -0.24257659912109375, -0.22800827026367188, -0.21343994140625, -0.19887161254882812, -0.18430328369140625, -0.16973495483398438, -0.1551666259765625, -0.14059829711914062, -0.12602996826171875, -0.11146163940429688, -0.096893310546875, -0.08232498168945312, -0.06775665283203125, -0.053188323974609375, -0.0386199951171875, -0.024051666259765625, -0.00948333740234375, 0.005084991455078125, 0.0196533203125, 0.034221649169921875, 0.04878997802734375, 0.06335830688476562, 0.0779266357421875, 0.09249496459960938, 0.10706329345703125, 0.12163162231445312, 0.136199951171875, 0.15076828002929688, 0.16533660888671875, 0.17990493774414062, 0.1944732666015625, 0.20904159545898438, 0.22360992431640625, 0.23817825317382812, 0.25274658203125, 0.2673149108886719, 0.28188323974609375, 0.2964515686035156, 0.3110198974609375, 0.3255882263183594, 0.34015655517578125, 0.3547248840332031, 0.369293212890625, 0.3838615417480469, 0.39842987060546875, 0.4129981994628906, 0.4275665283203125, 0.4421348571777344, 0.45670318603515625, 0.4712715148925781, 0.48583984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 5.0, 7.0, 13.0, 6.0, 6.0, 7.0, 14.0, 18.0, 11.0, 17.0, 28.0, 29.0, 35.0, 32.0, 29.0, 40.0, 36.0, 36.0, 31.0, 44.0, 1069.0, 43.0, 38.0, 38.0, 33.0, 40.0, 39.0, 33.0, 27.0, 33.0, 21.0, 28.0, 25.0, 30.0, 14.0, 12.0, 8.0, 9.0, 7.0, 4.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.33203125, -3.21734619140625, -3.1026611328125, -2.98797607421875, -2.873291015625, -2.75860595703125, -2.6439208984375, -2.52923583984375, -2.41455078125, -2.29986572265625, -2.1851806640625, -2.07049560546875, -1.955810546875, -1.84112548828125, -1.7264404296875, -1.61175537109375, -1.4970703125, -1.38238525390625, -1.2677001953125, -1.15301513671875, -1.038330078125, -0.92364501953125, -0.8089599609375, -0.69427490234375, -0.57958984375, -0.46490478515625, -0.3502197265625, -0.23553466796875, -0.120849609375, -0.00616455078125, 0.1085205078125, 0.22320556640625, 0.337890625, 0.45257568359375, 0.5672607421875, 0.68194580078125, 0.796630859375, 0.91131591796875, 1.0260009765625, 1.14068603515625, 1.25537109375, 1.37005615234375, 1.4847412109375, 1.59942626953125, 1.714111328125, 1.82879638671875, 1.9434814453125, 2.05816650390625, 2.1728515625, 2.28753662109375, 2.4022216796875, 2.51690673828125, 2.631591796875, 2.74627685546875, 2.8609619140625, 2.97564697265625, 3.09033203125, 3.20501708984375, 3.3197021484375, 3.43438720703125, 3.549072265625, 3.66375732421875, 3.7784423828125, 3.89312744140625, 4.0078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 11.0, 19.0, 28.0, 54.0, 70.0, 140.0, 230.0, 393.0, 609.0, 1145.0, 1863.0, 3087.0, 5359.0, 8868.0, 15267.0, 25898.0, 44093.0, 73825.0, 119166.0, 168667.0, 1232717.0, 149002.0, 99702.0, 60044.0, 35688.0, 21087.0, 12398.0, 7303.0, 4260.0, 2573.0, 1419.0, 858.0, 502.0, 305.0, 182.0, 131.0, 63.0, 40.0, 27.0, 16.0, 8.0, 6.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5124435424804688, -0.4970550537109375, -0.48166656494140625, -0.466278076171875, -0.45088958740234375, -0.4355010986328125, -0.42011260986328125, -0.40472412109375, -0.38933563232421875, -0.3739471435546875, -0.35855865478515625, -0.343170166015625, -0.32778167724609375, -0.3123931884765625, -0.29700469970703125, -0.2816162109375, -0.26622772216796875, -0.2508392333984375, -0.23545074462890625, -0.220062255859375, -0.20467376708984375, -0.1892852783203125, -0.17389678955078125, -0.15850830078125, -0.14311981201171875, -0.1277313232421875, -0.11234283447265625, -0.096954345703125, -0.08156585693359375, -0.0661773681640625, -0.05078887939453125, -0.035400390625, -0.02001190185546875, -0.0046234130859375, 0.01076507568359375, 0.026153564453125, 0.04154205322265625, 0.0569305419921875, 0.07231903076171875, 0.08770751953125, 0.10309600830078125, 0.1184844970703125, 0.13387298583984375, 0.149261474609375, 0.16464996337890625, 0.1800384521484375, 0.19542694091796875, 0.2108154296875, 0.22620391845703125, 0.2415924072265625, 0.25698089599609375, 0.272369384765625, 0.28775787353515625, 0.3031463623046875, 0.31853485107421875, 0.33392333984375, 0.34931182861328125, 0.3647003173828125, 0.38008880615234375, 0.395477294921875, 0.41086578369140625, 0.4262542724609375, 0.44164276123046875, 0.45703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 3.0, 17.0, 18.0, 19.0, 17.0, 25.0, 27.0, 29.0, 37.0, 33.0, 55.0, 49.0, 52.0, 55.0, 50.0, 57.0, 57.0, 65.0, 50.0, 34.0, 38.0, 39.0, 28.0, 31.0, 23.0, 25.0, 9.0, 9.0, 15.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001773834228515625, -0.0017108023166656494, -0.0016477704048156738, -0.0015847384929656982, -0.0015217065811157227, -0.001458674669265747, -0.0013956427574157715, -0.001332610845565796, -0.0012695789337158203, -0.0012065470218658447, -0.0011435151100158691, -0.0010804831981658936, -0.001017451286315918, -0.0009544193744659424, -0.0008913874626159668, -0.0008283555507659912, -0.0007653236389160156, -0.00070229172706604, -0.0006392598152160645, -0.0005762279033660889, -0.0005131959915161133, -0.0004501640796661377, -0.0003871321678161621, -0.0003241002559661865, -0.00026106834411621094, -0.00019803643226623535, -0.00013500452041625977, -7.197260856628418e-05, -8.940696716308594e-06, 5.409121513366699e-05, 0.00011712312698364258, 0.00018015503883361816, 0.00024318695068359375, 0.00030621886253356934, 0.0003692507743835449, 0.0004322826862335205, 0.0004953145980834961, 0.0005583465099334717, 0.0006213784217834473, 0.0006844103336334229, 0.0007474422454833984, 0.000810474157333374, 0.0008735060691833496, 0.0009365379810333252, 0.0009995698928833008, 0.0010626018047332764, 0.001125633716583252, 0.0011886656284332275, 0.0012516975402832031, 0.0013147294521331787, 0.0013777613639831543, 0.0014407932758331299, 0.0015038251876831055, 0.001566857099533081, 0.0016298890113830566, 0.0016929209232330322, 0.0017559528350830078, 0.0018189847469329834, 0.001882016658782959, 0.0019450485706329346, 0.00200808048248291, 0.0020711123943328857, 0.0021341443061828613, 0.002197176218032837, 0.0022602081298828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 7.0, 14.0, 18.0, 19.0, 33.0, 32.0, 40.0, 50.0, 78.0, 99.0, 123.0, 204.0, 261.0, 397.0, 709.0, 2458.0, 891582.0, 149158.0, 1340.0, 603.0, 374.0, 249.0, 171.0, 125.0, 74.0, 60.0, 57.0, 49.0, 39.0, 27.0, 25.0, 14.0, 9.0, 14.0, 6.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.04388427734375, -0.042693138122558594, -0.04150199890136719, -0.04031085968017578, -0.039119720458984375, -0.03792858123779297, -0.03673744201660156, -0.035546302795410156, -0.03435516357421875, -0.033164024353027344, -0.03197288513183594, -0.03078174591064453, -0.029590606689453125, -0.02839946746826172, -0.027208328247070312, -0.026017189025878906, -0.0248260498046875, -0.023634910583496094, -0.022443771362304688, -0.02125263214111328, -0.020061492919921875, -0.01887035369873047, -0.017679214477539062, -0.016488075256347656, -0.01529693603515625, -0.014105796813964844, -0.012914657592773438, -0.011723518371582031, -0.010532379150390625, -0.009341239929199219, -0.008150100708007812, -0.006958961486816406, -0.005767822265625, -0.004576683044433594, -0.0033855438232421875, -0.0021944046020507812, -0.001003265380859375, 0.00018787384033203125, 0.0013790130615234375, 0.0025701522827148438, 0.00376129150390625, 0.004952430725097656, 0.0061435699462890625, 0.007334709167480469, 0.008525848388671875, 0.009716987609863281, 0.010908126831054688, 0.012099266052246094, 0.0132904052734375, 0.014481544494628906, 0.015672683715820312, 0.01686382293701172, 0.018054962158203125, 0.01924610137939453, 0.020437240600585938, 0.021628379821777344, 0.02281951904296875, 0.024010658264160156, 0.025201797485351562, 0.02639293670654297, 0.027584075927734375, 0.02877521514892578, 0.029966354370117188, 0.031157493591308594, 0.0323486328125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 15.0, 170.0, 627.0, 193.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.007932843640446663, -0.007702961564064026, -0.007473079487681389, -0.007243197411298752, -0.007013315334916115, -0.006783433258533478, -0.0065535507164895535, -0.006323668640106916, -0.006093786563724279, -0.005863904487341642, -0.005634022410959005, -0.005404140334576368, -0.005174257792532444, -0.004944375716149807, -0.00471449363976717, -0.004484611563384533, -0.004254729487001896, -0.004024847410619259, -0.003794965334236622, -0.003565083025023341, -0.003335200948640704, -0.003105318872258067, -0.0028754365630447865, -0.0026455544866621494, -0.0024156724102795124, -0.0021857903338968754, -0.0019559082575142384, -0.0017260259483009577, -0.0014961438719183207, -0.0012662617955356836, -0.0010363796027377248, -0.0008064974099397659, -0.0005766157992184162, -0.0003467336646281183, -0.00011685153003782034, 0.0001130306045524776, 0.00034291273914277554, 0.0005727948155254126, 0.0008026770083233714, 0.0010325592011213303, 0.0012624412775039673, 0.0014923233538866043, 0.0017222055466845632, 0.001952087739482522, 0.002181969815865159, 0.002411851892247796, 0.0026417342014610767, 0.0028716162778437138, 0.003101498354226351, 0.003331380430608988, 0.003561262506991625, 0.0037911448162049055, 0.004021027125418186, 0.004250909201800823, 0.00448079127818346, 0.004710673354566097, 0.004940555430948734, 0.005170437507331371, 0.005400319583714008, 0.005630201660096645, 0.005860083736479282, 0.006089965812861919, 0.006319848354905844, 0.006549730431288481, 0.006779612507671118]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 7.0, 5.0, 7.0, 8.0, 10.0, 12.0, 16.0, 19.0, 24.0, 15.0, 21.0, 33.0, 20.0, 39.0, 32.0, 30.0, 32.0, 39.0, 40.0, 39.0, 46.0, 40.0, 42.0, 42.0, 38.0, 43.0, 48.0, 31.0, 30.0, 30.0, 20.0, 27.0, 31.0, 17.0, 17.0, 10.0, 16.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0011107921600341797, -0.0010784519836306572, -0.0010461118072271347, -0.0010137716308236122, -0.0009814314544200897, -0.0009490912780165672, -0.0009167511016130447, -0.0008844109252095222, -0.0008520707488059998, -0.0008197305724024773, -0.0007873903959989548, -0.0007550502195954323, -0.0007227100431919098, -0.0006903698667883873, -0.0006580296903848648, -0.0006256895139813423, -0.0005933493375778198, -0.0005610091611742973, -0.0005286689847707748, -0.0004963288083672523, -0.00046398863196372986, -0.00043164845556020737, -0.0003993082791566849, -0.0003669681027531624, -0.0003346279263496399, -0.0003022877499461174, -0.0002699475735425949, -0.00023760739713907242, -0.00020526722073554993, -0.00017292704433202744, -0.00014058686792850494, -0.00010824669152498245, -7.590651512145996e-05, -4.356633871793747e-05, -1.1226162314414978e-05, 2.1114014089107513e-05, 5.3454190492630005e-05, 8.57943668961525e-05, 0.00011813454329967499, 0.00015047471970319748, 0.00018281489610671997, 0.00021515507251024246, 0.00024749524891376495, 0.00027983542531728745, 0.00031217560172080994, 0.00034451577812433243, 0.0003768559545278549, 0.0004091961309313774, 0.0004415363073348999, 0.0004738764837384224, 0.0005062166601419449, 0.0005385568365454674, 0.0005708970129489899, 0.0006032371893525124, 0.0006355773657560349, 0.0006679175421595573, 0.0007002577185630798, 0.0007325978949666023, 0.0007649380713701248, 0.0007972782477736473, 0.0008296184241771698, 0.0008619586005806923, 0.0008942987769842148, 0.0009266389533877373, 0.0009589791297912598]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 10.0, 7.0, 8.0, 13.0, 20.0, 15.0, 14.0, 17.0, 31.0, 35.0, 36.0, 28.0, 22.0, 29.0, 33.0, 29.0, 39.0, 36.0, 32.0, 36.0, 52.0, 30.0, 37.0, 43.0, 40.0, 38.0, 34.0, 23.0, 25.0, 28.0, 22.0, 21.0, 27.0, 17.0, 15.0, 15.0, 5.0, 10.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.189697265625, -5.02001953125, -4.850341796875, -4.6806640625, -4.510986328125, -4.34130859375, -4.171630859375, -4.001953125, -3.832275390625, -3.66259765625, -3.492919921875, -3.3232421875, -3.153564453125, -2.98388671875, -2.814208984375, -2.64453125, -2.474853515625, -2.30517578125, -2.135498046875, -1.9658203125, -1.796142578125, -1.62646484375, -1.456787109375, -1.287109375, -1.117431640625, -0.94775390625, -0.778076171875, -0.6083984375, -0.438720703125, -0.26904296875, -0.099365234375, 0.0703125, 0.239990234375, 0.40966796875, 0.579345703125, 0.7490234375, 0.918701171875, 1.08837890625, 1.258056640625, 1.427734375, 1.597412109375, 1.76708984375, 1.936767578125, 2.1064453125, 2.276123046875, 2.44580078125, 2.615478515625, 2.78515625, 2.954833984375, 3.12451171875, 3.294189453125, 3.4638671875, 3.633544921875, 3.80322265625, 3.972900390625, 4.142578125, 4.312255859375, 4.48193359375, 4.651611328125, 4.8212890625, 4.990966796875, 5.16064453125, 5.330322265625, 5.5]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 27.0, 28.0, 17.0, 55.0, 62.0, 72.0, 121.0, 121.0, 201.0, 301.0, 446.0, 648.0, 1095.0, 1856.0, 3906.0, 10705.0, 38054.0, 201413.0, 604108.0, 140026.0, 28655.0, 8510.0, 3444.0, 1691.0, 1009.0, 604.0, 385.0, 279.0, 187.0, 134.0, 98.0, 73.0, 52.0, 33.0, 31.0, 26.0, 13.0, 7.0, 12.0, 7.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4296875, -9.12939453125, -8.8291015625, -8.52880859375, -8.228515625, -7.92822265625, -7.6279296875, -7.32763671875, -7.02734375, -6.72705078125, -6.4267578125, -6.12646484375, -5.826171875, -5.52587890625, -5.2255859375, -4.92529296875, -4.625, -4.32470703125, -4.0244140625, -3.72412109375, -3.423828125, -3.12353515625, -2.8232421875, -2.52294921875, -2.22265625, -1.92236328125, -1.6220703125, -1.32177734375, -1.021484375, -0.72119140625, -0.4208984375, -0.12060546875, 0.1796875, 0.47998046875, 0.7802734375, 1.08056640625, 1.380859375, 1.68115234375, 1.9814453125, 2.28173828125, 2.58203125, 2.88232421875, 3.1826171875, 3.48291015625, 3.783203125, 4.08349609375, 4.3837890625, 4.68408203125, 4.984375, 5.28466796875, 5.5849609375, 5.88525390625, 6.185546875, 6.48583984375, 6.7861328125, 7.08642578125, 7.38671875, 7.68701171875, 7.9873046875, 8.28759765625, 8.587890625, 8.88818359375, 9.1884765625, 9.48876953125, 9.7890625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 7.0, 6.0, 10.0, 9.0, 20.0, 17.0, 34.0, 35.0, 40.0, 52.0, 57.0, 61.0, 101.0, 282.0, 1688.0, 176.0, 104.0, 63.0, 46.0, 43.0, 46.0, 34.0, 25.0, 11.0, 16.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.49560546875, -15.9130859375, -15.33056640625, -14.748046875, -14.16552734375, -13.5830078125, -13.00048828125, -12.41796875, -11.83544921875, -11.2529296875, -10.67041015625, -10.087890625, -9.50537109375, -8.9228515625, -8.34033203125, -7.7578125, -7.17529296875, -6.5927734375, -6.01025390625, -5.427734375, -4.84521484375, -4.2626953125, -3.68017578125, -3.09765625, -2.51513671875, -1.9326171875, -1.35009765625, -0.767578125, -0.18505859375, 0.3974609375, 0.97998046875, 1.5625, 2.14501953125, 2.7275390625, 3.31005859375, 3.892578125, 4.47509765625, 5.0576171875, 5.64013671875, 6.22265625, 6.80517578125, 7.3876953125, 7.97021484375, 8.552734375, 9.13525390625, 9.7177734375, 10.30029296875, 10.8828125, 11.46533203125, 12.0478515625, 12.63037109375, 13.212890625, 13.79541015625, 14.3779296875, 14.96044921875, 15.54296875, 16.12548828125, 16.7080078125, 17.29052734375, 17.873046875, 18.45556640625, 19.0380859375, 19.62060546875, 20.203125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 18.0, 21.0, 24.0, 26.0, 50.0, 82.0, 168.0, 284.0, 630.0, 2392.0, 3122660.0, 17465.0, 959.0, 383.0, 195.0, 117.0, 59.0, 41.0, 29.0, 22.0, 20.0, 7.0, 3.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.25, -59.53466796875, -57.8193359375, -56.10400390625, -54.388671875, -52.67333984375, -50.9580078125, -49.24267578125, -47.52734375, -45.81201171875, -44.0966796875, -42.38134765625, -40.666015625, -38.95068359375, -37.2353515625, -35.52001953125, -33.8046875, -32.08935546875, -30.3740234375, -28.65869140625, -26.943359375, -25.22802734375, -23.5126953125, -21.79736328125, -20.08203125, -18.36669921875, -16.6513671875, -14.93603515625, -13.220703125, -11.50537109375, -9.7900390625, -8.07470703125, -6.359375, -4.64404296875, -2.9287109375, -1.21337890625, 0.501953125, 2.21728515625, 3.9326171875, 5.64794921875, 7.36328125, 9.07861328125, 10.7939453125, 12.50927734375, 14.224609375, 15.93994140625, 17.6552734375, 19.37060546875, 21.0859375, 22.80126953125, 24.5166015625, 26.23193359375, 27.947265625, 29.66259765625, 31.3779296875, 33.09326171875, 34.80859375, 36.52392578125, 38.2392578125, 39.95458984375, 41.669921875, 43.38525390625, 45.1005859375, 46.81591796875, 48.53125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 204.0, 726.0, 76.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.03435516357422, -60.329872131347656, -56.625389099121094, -52.9209098815918, -49.216426849365234, -45.51194381713867, -41.807464599609375, -38.10298156738281, -34.39849853515625, -30.694015502929688, -26.989534378051758, -23.285053253173828, -19.580570220947266, -15.876087188720703, -12.171606063842773, -8.467124938964844, -4.762641906738281, -1.0581598281860352, 2.646322250366211, 6.350804328918457, 10.055286407470703, 13.759769439697266, 17.464250564575195, 21.168731689453125, 24.873214721679688, 28.57769775390625, 32.28218078613281, 35.98666000366211, 39.69114303588867, 43.395626068115234, 47.10010528564453, 50.804588317871094, 54.509063720703125, 58.21354675292969, 61.91802978515625, 65.62251281738281, 69.32699584960938, 73.03147888183594, 76.73595428466797, 80.44043731689453, 84.1449203491211, 87.84940338134766, 91.55388641357422, 95.25836944580078, 98.96284484863281, 102.66732788085938, 106.37181091308594, 110.0762939453125, 113.78077697753906, 117.48526000976562, 121.18974304199219, 124.89422607421875, 128.5987091064453, 132.30319213867188, 136.00767517089844, 139.712158203125, 143.4166259765625, 147.12110900878906, 150.82559204101562, 154.5300750732422, 158.23455810546875, 161.9390411376953, 165.64352416992188, 169.34799194335938, 173.052490234375]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 8.0, 8.0, 2.0, 5.0, 9.0, 12.0, 13.0, 18.0, 23.0, 18.0, 22.0, 24.0, 22.0, 28.0, 38.0, 35.0, 46.0, 32.0, 37.0, 42.0, 44.0, 50.0, 43.0, 34.0, 39.0, 35.0, 36.0, 30.0, 36.0, 29.0, 30.0, 30.0, 21.0, 14.0, 15.0, 13.0, 13.0, 11.0, 7.0, 10.0, 3.0, 6.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-34.330711364746094, -33.250938415527344, -32.17116928100586, -31.09139633178711, -30.01162338256836, -28.931852340698242, -27.852081298828125, -26.772308349609375, -25.692535400390625, -24.612764358520508, -23.532991409301758, -22.45322036743164, -21.37344741821289, -20.293676376342773, -19.213905334472656, -18.134132385253906, -17.05436134338379, -15.974589347839355, -14.894817352294922, -13.815046310424805, -12.735273361206055, -11.655502319335938, -10.575730323791504, -9.49595832824707, -8.416186332702637, -7.336414337158203, -6.2566423416137695, -5.176870822906494, -4.0970988273620605, -3.017326831817627, -1.9375553131103516, -0.857783317565918, 0.22198867797851562, 1.3017605543136597, 2.3815324306488037, 3.461304187774658, 4.541076183319092, 5.620848178863525, 6.700619697570801, 7.780391693115234, 8.860163688659668, 9.939935684204102, 11.019707679748535, 12.099479675292969, 13.179250717163086, 14.259023666381836, 15.338794708251953, 16.418567657470703, 17.49833869934082, 18.578109741210938, 19.657882690429688, 20.737653732299805, 21.817426681518555, 22.897197723388672, 23.976970672607422, 25.05674171447754, 26.136512756347656, 27.216283798217773, 28.296056747436523, 29.37582778930664, 30.45560073852539, 31.535371780395508, 32.615142822265625, 33.694915771484375, 34.774688720703125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 12.0, 11.0, 8.0, 16.0, 17.0, 18.0, 24.0, 22.0, 23.0, 18.0, 31.0, 41.0, 36.0, 36.0, 44.0, 37.0, 44.0, 46.0, 48.0, 34.0, 29.0, 57.0, 26.0, 36.0, 43.0, 28.0, 25.0, 23.0, 21.0, 30.0, 14.0, 21.0, 11.0, 18.0, 7.0, 4.0, 5.0, 4.0, 10.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.1334228515625, -6.923095703125, -6.7127685546875, -6.50244140625, -6.2921142578125, -6.081787109375, -5.8714599609375, -5.6611328125, -5.4508056640625, -5.240478515625, -5.0301513671875, -4.81982421875, -4.6094970703125, -4.399169921875, -4.1888427734375, -3.978515625, -3.7681884765625, -3.557861328125, -3.3475341796875, -3.13720703125, -2.9268798828125, -2.716552734375, -2.5062255859375, -2.2958984375, -2.0855712890625, -1.875244140625, -1.6649169921875, -1.45458984375, -1.2442626953125, -1.033935546875, -0.8236083984375, -0.61328125, -0.4029541015625, -0.192626953125, 0.0177001953125, 0.22802734375, 0.4383544921875, 0.648681640625, 0.8590087890625, 1.0693359375, 1.2796630859375, 1.489990234375, 1.7003173828125, 1.91064453125, 2.1209716796875, 2.331298828125, 2.5416259765625, 2.751953125, 2.9622802734375, 3.172607421875, 3.3829345703125, 3.59326171875, 3.8035888671875, 4.013916015625, 4.2242431640625, 4.4345703125, 4.6448974609375, 4.855224609375, 5.0655517578125, 5.27587890625, 5.4862060546875, 5.696533203125, 5.9068603515625, 6.1171875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 10.0, 14.0, 11.0, 16.0, 22.0, 26.0, 41.0, 35.0, 44.0, 59.0, 60.0, 77.0, 116.0, 156.0, 202.0, 224.0, 360.0, 490.0, 883.0, 1818.0, 6791.0, 81212.0, 3554881.0, 526849.0, 13834.0, 2762.0, 1058.0, 584.0, 403.0, 253.0, 202.0, 164.0, 126.0, 102.0, 79.0, 62.0, 58.0, 41.0, 34.0, 24.0, 14.0, 17.0, 15.0, 10.0, 9.0, 8.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.0625, -32.01904296875, -30.9755859375, -29.93212890625, -28.888671875, -27.84521484375, -26.8017578125, -25.75830078125, -24.71484375, -23.67138671875, -22.6279296875, -21.58447265625, -20.541015625, -19.49755859375, -18.4541015625, -17.41064453125, -16.3671875, -15.32373046875, -14.2802734375, -13.23681640625, -12.193359375, -11.14990234375, -10.1064453125, -9.06298828125, -8.01953125, -6.97607421875, -5.9326171875, -4.88916015625, -3.845703125, -2.80224609375, -1.7587890625, -0.71533203125, 0.328125, 1.37158203125, 2.4150390625, 3.45849609375, 4.501953125, 5.54541015625, 6.5888671875, 7.63232421875, 8.67578125, 9.71923828125, 10.7626953125, 11.80615234375, 12.849609375, 13.89306640625, 14.9365234375, 15.97998046875, 17.0234375, 18.06689453125, 19.1103515625, 20.15380859375, 21.197265625, 22.24072265625, 23.2841796875, 24.32763671875, 25.37109375, 26.41455078125, 27.4580078125, 28.50146484375, 29.544921875, 30.58837890625, 31.6318359375, 32.67529296875, 33.71875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 17.0, 25.0, 86.0, 178.0, 488.0, 972.0, 1256.0, 597.0, 245.0, 104.0, 46.0, 16.0, 15.0, 5.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.78125, -36.9447021484375, -36.108154296875, -35.2716064453125, -34.43505859375, -33.5985107421875, -32.761962890625, -31.9254150390625, -31.0888671875, -30.2523193359375, -29.415771484375, -28.5792236328125, -27.74267578125, -26.9061279296875, -26.069580078125, -25.2330322265625, -24.396484375, -23.5599365234375, -22.723388671875, -21.8868408203125, -21.05029296875, -20.2137451171875, -19.377197265625, -18.5406494140625, -17.7041015625, -16.8675537109375, -16.031005859375, -15.1944580078125, -14.35791015625, -13.5213623046875, -12.684814453125, -11.8482666015625, -11.01171875, -10.1751708984375, -9.338623046875, -8.5020751953125, -7.66552734375, -6.8289794921875, -5.992431640625, -5.1558837890625, -4.3193359375, -3.4827880859375, -2.646240234375, -1.8096923828125, -0.97314453125, -0.1365966796875, 0.699951171875, 1.5364990234375, 2.373046875, 3.2095947265625, 4.046142578125, 4.8826904296875, 5.71923828125, 6.5557861328125, 7.392333984375, 8.2288818359375, 9.0654296875, 9.9019775390625, 10.738525390625, 11.5750732421875, 12.41162109375, 13.2481689453125, 14.084716796875, 14.9212646484375, 15.7578125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 8.0, 15.0, 31.0, 43.0, 45.0, 89.0, 178.0, 535.0, 2273.0, 29930.0, 3812218.0, 340758.0, 6612.0, 933.0, 324.0, 117.0, 71.0, 37.0, 27.0, 16.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.0625, -40.9482421875, -39.833984375, -38.7197265625, -37.60546875, -36.4912109375, -35.376953125, -34.2626953125, -33.1484375, -32.0341796875, -30.919921875, -29.8056640625, -28.69140625, -27.5771484375, -26.462890625, -25.3486328125, -24.234375, -23.1201171875, -22.005859375, -20.8916015625, -19.77734375, -18.6630859375, -17.548828125, -16.4345703125, -15.3203125, -14.2060546875, -13.091796875, -11.9775390625, -10.86328125, -9.7490234375, -8.634765625, -7.5205078125, -6.40625, -5.2919921875, -4.177734375, -3.0634765625, -1.94921875, -0.8349609375, 0.279296875, 1.3935546875, 2.5078125, 3.6220703125, 4.736328125, 5.8505859375, 6.96484375, 8.0791015625, 9.193359375, 10.3076171875, 11.421875, 12.5361328125, 13.650390625, 14.7646484375, 15.87890625, 16.9931640625, 18.107421875, 19.2216796875, 20.3359375, 21.4501953125, 22.564453125, 23.6787109375, 24.79296875, 25.9072265625, 27.021484375, 28.1357421875, 29.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 4.0, 7.0, 19.0, 26.0, 27.0, 70.0, 103.0, 123.0, 128.0, 137.0, 111.0, 83.0, 68.0, 34.0, 21.0, 21.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.160179138183594, -37.987518310546875, -34.814857482910156, -31.642200469970703, -28.469539642333984, -25.296878814697266, -22.12421989440918, -18.951560974121094, -15.778900146484375, -12.606240272521973, -9.43358039855957, -6.260920524597168, -3.0882606506347656, 0.08439922332763672, 3.257059097290039, 6.429718017578125, 9.602378845214844, 12.775038719177246, 15.947698593139648, 19.120357513427734, 22.293018341064453, 25.465679168701172, 28.638338088989258, 31.810997009277344, 34.98365783691406, 38.15631866455078, 41.3289794921875, 44.50163650512695, 47.67429733276367, 50.84695816040039, 54.019615173339844, 57.19227600097656, 60.36494445800781, 63.53760528564453, 66.71026611328125, 69.88292694091797, 73.05558776855469, 76.22824096679688, 79.4009017944336, 82.57356262207031, 85.74622344970703, 88.91888427734375, 92.09154510498047, 95.26420593261719, 98.43685913085938, 101.6095199584961, 104.78218078613281, 107.95484161376953, 111.12750244140625, 114.30016326904297, 117.47282409667969, 120.6454849243164, 123.81814575195312, 126.99079895019531, 130.16346740722656, 133.33612060546875, 136.5087890625, 139.6814422607422, 142.85411071777344, 146.02676391601562, 149.19943237304688, 152.37208557128906, 155.5447540283203, 158.7174072265625, 161.8900604248047]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 5.0, 4.0, 9.0, 16.0, 20.0, 13.0, 24.0, 18.0, 24.0, 24.0, 34.0, 27.0, 30.0, 31.0, 29.0, 39.0, 34.0, 36.0, 44.0, 44.0, 39.0, 42.0, 35.0, 37.0, 31.0, 28.0, 38.0, 16.0, 31.0, 30.0, 24.0, 18.0, 13.0, 17.0, 13.0, 11.0, 16.0, 6.0, 8.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.422119140625, -39.09198760986328, -37.76185989379883, -36.43172836303711, -35.101600646972656, -33.77146911621094, -32.44133758544922, -31.111207962036133, -29.781078338623047, -28.45094871520996, -27.120819091796875, -25.790687561035156, -24.46055793762207, -23.130428314208984, -21.800296783447266, -20.47016716003418, -19.140037536621094, -17.809907913208008, -16.479778289794922, -15.149646759033203, -13.819517135620117, -12.489387512207031, -11.159256935119629, -9.829126358032227, -8.49899673461914, -7.1688666343688965, -5.838736534118652, -4.508606433868408, -3.178476333618164, -1.84834623336792, -0.5182161331176758, 0.8119144439697266, 2.1420440673828125, 3.4721741676330566, 4.802304267883301, 6.132434368133545, 7.462564468383789, 8.792694091796875, 10.122824668884277, 11.45295524597168, 12.783084869384766, 14.113214492797852, 15.443345069885254, 16.773475646972656, 18.103605270385742, 19.433734893798828, 20.763866424560547, 22.093996047973633, 23.42412567138672, 24.754255294799805, 26.08438491821289, 27.41451644897461, 28.744646072387695, 30.07477569580078, 31.4049072265625, 32.73503875732422, 34.06516647338867, 35.39529800415039, 36.725425720214844, 38.05555725097656, 39.38568878173828, 40.715816497802734, 42.04594802856445, 43.376075744628906, 44.706207275390625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 7.0, 5.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 19.0, 27.0, 36.0, 33.0, 29.0, 28.0, 42.0, 42.0, 39.0, 29.0, 42.0, 44.0, 50.0, 42.0, 40.0, 27.0, 36.0, 29.0, 27.0, 30.0, 28.0, 24.0, 26.0, 17.0, 9.0, 16.0, 19.0, 12.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-75.125, -72.7626953125, -70.400390625, -68.0380859375, -65.67578125, -63.3134765625, -60.951171875, -58.5888671875, -56.2265625, -53.8642578125, -51.501953125, -49.1396484375, -46.77734375, -44.4150390625, -42.052734375, -39.6904296875, -37.328125, -34.9658203125, -32.603515625, -30.2412109375, -27.87890625, -25.5166015625, -23.154296875, -20.7919921875, -18.4296875, -16.0673828125, -13.705078125, -11.3427734375, -8.98046875, -6.6181640625, -4.255859375, -1.8935546875, 0.46875, 2.8310546875, 5.193359375, 7.5556640625, 9.91796875, 12.2802734375, 14.642578125, 17.0048828125, 19.3671875, 21.7294921875, 24.091796875, 26.4541015625, 28.81640625, 31.1787109375, 33.541015625, 35.9033203125, 38.265625, 40.6279296875, 42.990234375, 45.3525390625, 47.71484375, 50.0771484375, 52.439453125, 54.8017578125, 57.1640625, 59.5263671875, 61.888671875, 64.2509765625, 66.61328125, 68.9755859375, 71.337890625, 73.7001953125, 76.0625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 4.0, 13.0, 14.0, 28.0, 37.0, 66.0, 104.0, 159.0, 246.0, 406.0, 572.0, 929.0, 1429.0, 2098.0, 3379.0, 5069.0, 7840.0, 12261.0, 18763.0, 29532.0, 46597.0, 72496.0, 108444.0, 148386.0, 167116.0, 140643.0, 99082.0, 65315.0, 42101.0, 26727.0, 17218.0, 11175.0, 7108.0, 4573.0, 3042.0, 1982.0, 1272.0, 808.0, 547.0, 368.0, 223.0, 152.0, 90.0, 53.0, 36.0, 26.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.0625, -5.88092041015625, -5.6993408203125, -5.51776123046875, -5.336181640625, -5.15460205078125, -4.9730224609375, -4.79144287109375, -4.60986328125, -4.42828369140625, -4.2467041015625, -4.06512451171875, -3.883544921875, -3.70196533203125, -3.5203857421875, -3.33880615234375, -3.1572265625, -2.97564697265625, -2.7940673828125, -2.61248779296875, -2.430908203125, -2.24932861328125, -2.0677490234375, -1.88616943359375, -1.70458984375, -1.52301025390625, -1.3414306640625, -1.15985107421875, -0.978271484375, -0.79669189453125, -0.6151123046875, -0.43353271484375, -0.251953125, -0.07037353515625, 0.1112060546875, 0.29278564453125, 0.474365234375, 0.65594482421875, 0.8375244140625, 1.01910400390625, 1.20068359375, 1.38226318359375, 1.5638427734375, 1.74542236328125, 1.927001953125, 2.10858154296875, 2.2901611328125, 2.47174072265625, 2.6533203125, 2.83489990234375, 3.0164794921875, 3.19805908203125, 3.379638671875, 3.56121826171875, 3.7427978515625, 3.92437744140625, 4.10595703125, 4.28753662109375, 4.4691162109375, 4.65069580078125, 4.832275390625, 5.01385498046875, 5.1954345703125, 5.37701416015625, 5.55859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 11.0, 9.0, 8.0, 15.0, 27.0, 24.0, 25.0, 25.0, 24.0, 29.0, 26.0, 36.0, 41.0, 55.0, 30.0, 42.0, 49.0, 1066.0, 43.0, 39.0, 35.0, 30.0, 22.0, 46.0, 38.0, 33.0, 24.0, 26.0, 18.0, 11.0, 20.0, 15.0, 12.0, 10.0, 7.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.875, -51.2802734375, -49.685546875, -48.0908203125, -46.49609375, -44.9013671875, -43.306640625, -41.7119140625, -40.1171875, -38.5224609375, -36.927734375, -35.3330078125, -33.73828125, -32.1435546875, -30.548828125, -28.9541015625, -27.359375, -25.7646484375, -24.169921875, -22.5751953125, -20.98046875, -19.3857421875, -17.791015625, -16.1962890625, -14.6015625, -13.0068359375, -11.412109375, -9.8173828125, -8.22265625, -6.6279296875, -5.033203125, -3.4384765625, -1.84375, -0.2490234375, 1.345703125, 2.9404296875, 4.53515625, 6.1298828125, 7.724609375, 9.3193359375, 10.9140625, 12.5087890625, 14.103515625, 15.6982421875, 17.29296875, 18.8876953125, 20.482421875, 22.0771484375, 23.671875, 25.2666015625, 26.861328125, 28.4560546875, 30.05078125, 31.6455078125, 33.240234375, 34.8349609375, 36.4296875, 38.0244140625, 39.619140625, 41.2138671875, 42.80859375, 44.4033203125, 45.998046875, 47.5927734375, 49.1875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 9.0, 7.0, 17.0, 28.0, 35.0, 57.0, 74.0, 119.0, 196.0, 314.0, 503.0, 693.0, 1133.0, 1799.0, 2854.0, 4552.0, 7190.0, 11324.0, 17975.0, 28865.0, 46365.0, 73301.0, 112166.0, 153878.0, 1216529.0, 142627.0, 100577.0, 64647.0, 40615.0, 25373.0, 15975.0, 9990.0, 6432.0, 4018.0, 2628.0, 1563.0, 955.0, 615.0, 380.0, 271.0, 150.0, 114.0, 83.0, 53.0, 34.0, 16.0, 15.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-5.640625, -5.46075439453125, -5.2808837890625, -5.10101318359375, -4.921142578125, -4.74127197265625, -4.5614013671875, -4.38153076171875, -4.20166015625, -4.02178955078125, -3.8419189453125, -3.66204833984375, -3.482177734375, -3.30230712890625, -3.1224365234375, -2.94256591796875, -2.7626953125, -2.58282470703125, -2.4029541015625, -2.22308349609375, -2.043212890625, -1.86334228515625, -1.6834716796875, -1.50360107421875, -1.32373046875, -1.14385986328125, -0.9639892578125, -0.78411865234375, -0.604248046875, -0.42437744140625, -0.2445068359375, -0.06463623046875, 0.115234375, 0.29510498046875, 0.4749755859375, 0.65484619140625, 0.834716796875, 1.01458740234375, 1.1944580078125, 1.37432861328125, 1.55419921875, 1.73406982421875, 1.9139404296875, 2.09381103515625, 2.273681640625, 2.45355224609375, 2.6334228515625, 2.81329345703125, 2.9931640625, 3.17303466796875, 3.3529052734375, 3.53277587890625, 3.712646484375, 3.89251708984375, 4.0723876953125, 4.25225830078125, 4.43212890625, 4.61199951171875, 4.7918701171875, 4.97174072265625, 5.151611328125, 5.33148193359375, 5.5113525390625, 5.69122314453125, 5.87109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 6.0, 6.0, 6.0, 6.0, 9.0, 10.0, 10.0, 20.0, 13.0, 22.0, 47.0, 23.0, 37.0, 44.0, 47.0, 70.0, 69.0, 70.0, 74.0, 62.0, 54.0, 52.0, 44.0, 28.0, 28.0, 27.0, 26.0, 14.0, 11.0, 9.0, 13.0, 8.0, 1.0, 5.0, 0.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04443359375, -0.042922019958496094, -0.04141044616699219, -0.03989887237548828, -0.038387298583984375, -0.03687572479248047, -0.03536415100097656, -0.033852577209472656, -0.03234100341796875, -0.030829429626464844, -0.029317855834960938, -0.02780628204345703, -0.026294708251953125, -0.02478313446044922, -0.023271560668945312, -0.021759986877441406, -0.0202484130859375, -0.018736839294433594, -0.017225265502929688, -0.01571369171142578, -0.014202117919921875, -0.012690544128417969, -0.011178970336914062, -0.009667396545410156, -0.00815582275390625, -0.006644248962402344, -0.0051326751708984375, -0.0036211013793945312, -0.002109527587890625, -0.0005979537963867188, 0.0009136199951171875, 0.0024251937866210938, 0.003936767578125, 0.005448341369628906, 0.0069599151611328125, 0.008471488952636719, 0.009983062744140625, 0.011494636535644531, 0.013006210327148438, 0.014517784118652344, 0.01602935791015625, 0.017540931701660156, 0.019052505493164062, 0.02056407928466797, 0.022075653076171875, 0.02358722686767578, 0.025098800659179688, 0.026610374450683594, 0.0281219482421875, 0.029633522033691406, 0.031145095825195312, 0.03265666961669922, 0.034168243408203125, 0.03567981719970703, 0.03719139099121094, 0.038702964782714844, 0.04021453857421875, 0.041726112365722656, 0.04323768615722656, 0.04474925994873047, 0.046260833740234375, 0.04777240753173828, 0.04928398132324219, 0.050795555114746094, 0.05230712890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 11.0, 9.0, 11.0, 18.0, 17.0, 21.0, 31.0, 50.0, 55.0, 70.0, 96.0, 133.0, 171.0, 204.0, 337.0, 590.0, 978.0, 1908.0, 4782.0, 14837.0, 56362.0, 258210.0, 515524.0, 144019.0, 33524.0, 9401.0, 3306.0, 1484.0, 791.0, 458.0, 312.0, 179.0, 145.0, 131.0, 86.0, 68.0, 54.0, 34.0, 36.0, 22.0, 10.0, 16.0, 11.0, 8.0, 5.0, 10.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-0.31689453125, -0.3076591491699219, -0.29842376708984375, -0.2891883850097656, -0.2799530029296875, -0.2707176208496094, -0.26148223876953125, -0.2522468566894531, -0.243011474609375, -0.23377609252929688, -0.22454071044921875, -0.21530532836914062, -0.2060699462890625, -0.19683456420898438, -0.18759918212890625, -0.17836380004882812, -0.16912841796875, -0.15989303588867188, -0.15065765380859375, -0.14142227172851562, -0.1321868896484375, -0.12295150756835938, -0.11371612548828125, -0.10448074340820312, -0.095245361328125, -0.08600997924804688, -0.07677459716796875, -0.06753921508789062, -0.0583038330078125, -0.049068450927734375, -0.03983306884765625, -0.030597686767578125, -0.0213623046875, -0.012126922607421875, -0.00289154052734375, 0.006343841552734375, 0.0155792236328125, 0.024814605712890625, 0.03404998779296875, 0.043285369873046875, 0.052520751953125, 0.061756134033203125, 0.07099151611328125, 0.08022689819335938, 0.0894622802734375, 0.09869766235351562, 0.10793304443359375, 0.11716842651367188, 0.12640380859375, 0.13563919067382812, 0.14487457275390625, 0.15410995483398438, 0.1633453369140625, 0.17258071899414062, 0.18181610107421875, 0.19105148315429688, 0.200286865234375, 0.20952224731445312, 0.21875762939453125, 0.22799301147460938, 0.2372283935546875, 0.24646377563476562, 0.25569915771484375, 0.2649345397949219, 0.274169921875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 10.0, 37.0, 55.0, 102.0, 175.0, 196.0, 144.0, 99.0, 70.0, 39.0, 24.0, 12.0, 14.0, 6.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04953237250447273, -0.04664928838610649, -0.04376620054244995, -0.04088311642408371, -0.03800003230571747, -0.03511694818735123, -0.03223386034369469, -0.029350776225328445, -0.026467690244317055, -0.023584604263305664, -0.020701520144939423, -0.017818434163928032, -0.014935349114239216, -0.0120522640645504, -0.009169178083539009, -0.006286093965172768, -0.003403007984161377, -0.0005199227016419172, 0.0023631625808775425, 0.005246248096227646, 0.008129333145916462, 0.011012418195605278, 0.013895504176616669, 0.01677858829498291, 0.0196616742759943, 0.02254476025700569, 0.025427844375371933, 0.028310930356383324, 0.031194016337394714, 0.034077100455760956, 0.0369601845741272, 0.03984326869249344, 0.04272636026144028, 0.04560944437980652, 0.04849253222346306, 0.0513756163418293, 0.05425870046019554, 0.05714178830385208, 0.06002487242221832, 0.06290795654058456, 0.0657910406589508, 0.06867412477731705, 0.07155720889568329, 0.07444030046463013, 0.07732338458299637, 0.08020646870136261, 0.08308955281972885, 0.08597263693809509, 0.08885572850704193, 0.09173881262540817, 0.09462189674377441, 0.09750498831272125, 0.1003880724310875, 0.10327115654945374, 0.10615424066781998, 0.10903732478618622, 0.11192040890455246, 0.1148034930229187, 0.11768657714128494, 0.12056966125965118, 0.12345275282859802, 0.12633582949638367, 0.1292189210653305, 0.13210201263427734, 0.134985089302063]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 10.0, 4.0, 5.0, 10.0, 7.0, 8.0, 12.0, 12.0, 18.0, 23.0, 11.0, 10.0, 27.0, 23.0, 28.0, 38.0, 37.0, 31.0, 40.0, 32.0, 29.0, 51.0, 34.0, 37.0, 44.0, 25.0, 43.0, 47.0, 28.0, 39.0, 30.0, 23.0, 26.0, 22.0, 24.0, 21.0, 17.0, 20.0, 9.0, 12.0, 7.0, 9.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.03220796585083008, -0.03122302144765854, -0.03023807890713215, -0.02925313636660576, -0.02826819196343422, -0.02728324756026268, -0.02629830501973629, -0.0253133624792099, -0.02432841807603836, -0.02334347367286682, -0.02235853113234043, -0.02137358859181404, -0.020388644188642502, -0.019403699785470963, -0.018418757244944572, -0.017433814704418182, -0.016448870301246643, -0.015463926829397678, -0.014478983357548714, -0.013494039885699749, -0.012509096413850784, -0.01152415294200182, -0.010539209470152855, -0.00955426599830389, -0.008569322526454926, -0.007584379054605961, -0.006599435582756996, -0.0056144921109080315, -0.004629548639059067, -0.003644605167210102, -0.0026596616953611374, -0.0016747182235121727, -0.000689774751663208, 0.0002951687201857567, 0.0012801121920347214, 0.002265055663883686, 0.0032499991357326508, 0.0042349426075816154, 0.00521988607943058, 0.006204829551279545, 0.0071897730231285095, 0.008174716494977474, 0.009159659966826439, 0.010144603438675404, 0.011129546910524368, 0.012114490382373333, 0.013099433854222298, 0.014084377326071262, 0.015069320797920227, 0.016054265201091766, 0.017039207741618156, 0.018024150282144547, 0.019009094685316086, 0.019994039088487625, 0.020978981629014015, 0.021963924169540405, 0.022948868572711945, 0.023933812975883484, 0.024918755516409874, 0.025903698056936264, 0.026888642460107803, 0.027873586863279343, 0.028858529403805733, 0.029843471944332123, 0.030828416347503662]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 3.0, 6.0, 3.0, 9.0, 6.0, 6.0, 12.0, 11.0, 16.0, 9.0, 14.0, 13.0, 20.0, 27.0, 37.0, 30.0, 29.0, 29.0, 41.0, 43.0, 39.0, 30.0, 43.0, 42.0, 49.0, 42.0, 41.0, 26.0, 37.0, 28.0, 29.0, 31.0, 26.0, 24.0, 23.0, 19.0, 10.0, 16.0, 20.0, 11.0, 9.0, 9.0, 10.0, 4.0, 5.0, 3.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-75.0625, -72.7021484375, -70.341796875, -67.9814453125, -65.62109375, -63.2607421875, -60.900390625, -58.5400390625, -56.1796875, -53.8193359375, -51.458984375, -49.0986328125, -46.73828125, -44.3779296875, -42.017578125, -39.6572265625, -37.296875, -34.9365234375, -32.576171875, -30.2158203125, -27.85546875, -25.4951171875, -23.134765625, -20.7744140625, -18.4140625, -16.0537109375, -13.693359375, -11.3330078125, -8.97265625, -6.6123046875, -4.251953125, -1.8916015625, 0.46875, 2.8291015625, 5.189453125, 7.5498046875, 9.91015625, 12.2705078125, 14.630859375, 16.9912109375, 19.3515625, 21.7119140625, 24.072265625, 26.4326171875, 28.79296875, 31.1533203125, 33.513671875, 35.8740234375, 38.234375, 40.5947265625, 42.955078125, 45.3154296875, 47.67578125, 50.0361328125, 52.396484375, 54.7568359375, 57.1171875, 59.4775390625, 61.837890625, 64.1982421875, 66.55859375, 68.9189453125, 71.279296875, 73.6396484375, 76.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 5.0, 11.0, 17.0, 19.0, 24.0, 39.0, 45.0, 77.0, 88.0, 177.0, 253.0, 373.0, 689.0, 1233.0, 2272.0, 4740.0, 11699.0, 37529.0, 180240.0, 593883.0, 160095.0, 34364.0, 11073.0, 4484.0, 2155.0, 1191.0, 621.0, 400.0, 214.0, 161.0, 102.0, 83.0, 52.0, 27.0, 21.0, 26.0, 13.0, 17.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.517578125, -15.95703125, -15.396484375, -14.8359375, -14.275390625, -13.71484375, -13.154296875, -12.59375, -12.033203125, -11.47265625, -10.912109375, -10.3515625, -9.791015625, -9.23046875, -8.669921875, -8.109375, -7.548828125, -6.98828125, -6.427734375, -5.8671875, -5.306640625, -4.74609375, -4.185546875, -3.625, -3.064453125, -2.50390625, -1.943359375, -1.3828125, -0.822265625, -0.26171875, 0.298828125, 0.859375, 1.419921875, 1.98046875, 2.541015625, 3.1015625, 3.662109375, 4.22265625, 4.783203125, 5.34375, 5.904296875, 6.46484375, 7.025390625, 7.5859375, 8.146484375, 8.70703125, 9.267578125, 9.828125, 10.388671875, 10.94921875, 11.509765625, 12.0703125, 12.630859375, 13.19140625, 13.751953125, 14.3125, 14.873046875, 15.43359375, 15.994140625, 16.5546875, 17.115234375, 17.67578125, 18.236328125, 18.796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 11.0, 28.0, 29.0, 28.0, 36.0, 48.0, 56.0, 58.0, 72.0, 87.0, 2128.0, 75.0, 79.0, 54.0, 41.0, 39.0, 26.0, 25.0, 19.0, 15.0, 12.0, 7.0, 9.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-175.5, -168.85546875, -162.2109375, -155.56640625, -148.921875, -142.27734375, -135.6328125, -128.98828125, -122.34375, -115.69921875, -109.0546875, -102.41015625, -95.765625, -89.12109375, -82.4765625, -75.83203125, -69.1875, -62.54296875, -55.8984375, -49.25390625, -42.609375, -35.96484375, -29.3203125, -22.67578125, -16.03125, -9.38671875, -2.7421875, 3.90234375, 10.546875, 17.19140625, 23.8359375, 30.48046875, 37.125, 43.76953125, 50.4140625, 57.05859375, 63.703125, 70.34765625, 76.9921875, 83.63671875, 90.28125, 96.92578125, 103.5703125, 110.21484375, 116.859375, 123.50390625, 130.1484375, 136.79296875, 143.4375, 150.08203125, 156.7265625, 163.37109375, 170.015625, 176.66015625, 183.3046875, 189.94921875, 196.59375, 203.23828125, 209.8828125, 216.52734375, 223.171875, 229.81640625, 236.4609375, 243.10546875, 249.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 8.0, 8.0, 13.0, 17.0, 11.0, 28.0, 36.0, 52.0, 81.0, 98.0, 194.0, 242.0, 409.0, 872.0, 2214.0, 9776.0, 165203.0, 2922826.0, 36072.0, 4461.0, 1384.0, 683.0, 351.0, 192.0, 143.0, 89.0, 70.0, 41.0, 27.0, 27.0, 22.0, 8.0, 10.0, 4.0, 7.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-50.84375, -49.44189453125, -48.0400390625, -46.63818359375, -45.236328125, -43.83447265625, -42.4326171875, -41.03076171875, -39.62890625, -38.22705078125, -36.8251953125, -35.42333984375, -34.021484375, -32.61962890625, -31.2177734375, -29.81591796875, -28.4140625, -27.01220703125, -25.6103515625, -24.20849609375, -22.806640625, -21.40478515625, -20.0029296875, -18.60107421875, -17.19921875, -15.79736328125, -14.3955078125, -12.99365234375, -11.591796875, -10.18994140625, -8.7880859375, -7.38623046875, -5.984375, -4.58251953125, -3.1806640625, -1.77880859375, -0.376953125, 1.02490234375, 2.4267578125, 3.82861328125, 5.23046875, 6.63232421875, 8.0341796875, 9.43603515625, 10.837890625, 12.23974609375, 13.6416015625, 15.04345703125, 16.4453125, 17.84716796875, 19.2490234375, 20.65087890625, 22.052734375, 23.45458984375, 24.8564453125, 26.25830078125, 27.66015625, 29.06201171875, 30.4638671875, 31.86572265625, 33.267578125, 34.66943359375, 36.0712890625, 37.47314453125, 38.875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 16.0, 31.0, 142.0, 460.0, 242.0, 76.0, 22.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-918.1880493164062, -899.7416381835938, -881.2952270507812, -862.8488159179688, -844.4024658203125, -825.9560546875, -807.5096435546875, -789.063232421875, -770.6168212890625, -752.17041015625, -733.7239990234375, -715.277587890625, -696.8311767578125, -678.3848266601562, -659.9384155273438, -641.4920043945312, -623.0455932617188, -604.5991821289062, -586.1527709960938, -567.7063598632812, -549.260009765625, -530.8135986328125, -512.3671875, -493.9207763671875, -475.474365234375, -457.0279541015625, -438.58154296875, -420.1351623535156, -401.6887512207031, -383.2423400878906, -364.79595947265625, -346.34954833984375, -327.9031677246094, -309.4567565917969, -291.0103759765625, -272.56396484375, -254.1175537109375, -235.671142578125, -217.22474670410156, -198.77835083007812, -180.33193969726562, -161.88552856445312, -143.4391326904297, -124.99272918701172, -106.54632568359375, -88.09992218017578, -69.65351867675781, -51.207122802734375, -32.760711669921875, -14.314308166503906, 4.1320953369140625, 22.57849884033203, 41.02490234375, 59.47130584716797, 77.91770935058594, 96.36410522460938, 114.81051635742188, 133.25692749023438, 151.7033233642578, 170.14971923828125, 188.59613037109375, 207.04254150390625, 225.4889373779297, 243.93533325195312, 262.3817443847656]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 15.0, 8.0, 25.0, 15.0, 22.0, 33.0, 29.0, 30.0, 34.0, 38.0, 49.0, 40.0, 51.0, 61.0, 55.0, 46.0, 62.0, 57.0, 44.0, 37.0, 44.0, 33.0, 24.0, 23.0, 18.0, 14.0, 16.0, 8.0, 13.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-227.23028564453125, -220.158935546875, -213.08758544921875, -206.01622009277344, -198.9448699951172, -191.87351989746094, -184.80215454101562, -177.73080444335938, -170.65945434570312, -163.58810424804688, -156.51675415039062, -149.4453887939453, -142.37403869628906, -135.3026885986328, -128.2313232421875, -121.15997314453125, -114.088623046875, -107.01727294921875, -99.94591522216797, -92.87455749511719, -85.80320739746094, -78.73185729980469, -71.6604995727539, -64.58914184570312, -57.517791748046875, -50.44643783569336, -43.375083923339844, -36.30373001098633, -29.232376098632812, -22.161022186279297, -15.089668273925781, -8.018314361572266, -0.94696044921875, 6.124393463134766, 13.195747375488281, 20.267101287841797, 27.338455200195312, 34.40980911254883, 41.481163024902344, 48.55251693725586, 55.623870849609375, 62.69522476196289, 69.7665786743164, 76.83793640136719, 83.90928649902344, 90.98063659667969, 98.05199432373047, 105.12335205078125, 112.1947021484375, 119.26605224609375, 126.33740997314453, 133.4087677001953, 140.48011779785156, 147.5514678955078, 154.62283325195312, 161.69418334960938, 168.76553344726562, 175.83688354492188, 182.90823364257812, 189.97959899902344, 197.0509490966797, 204.12229919433594, 211.19366455078125, 218.2650146484375, 225.33636474609375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 9.0, 8.0, 9.0, 11.0, 11.0, 22.0, 41.0, 39.0, 61.0, 71.0, 89.0, 122.0, 194.0, 245.0, 342.0, 435.0, 602.0, 744.0, 1239.0, 1040828.0, 802.0, 677.0, 506.0, 347.0, 305.0, 194.0, 146.0, 116.0, 75.0, 61.0, 40.0, 40.0, 24.0, 20.0, 14.0, 18.0, 12.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.662567138671875, -42.0578727722168, -40.453182220458984, -38.848487854003906, -37.243797302246094, -35.639102935791016, -34.03440856933594, -32.429718017578125, -30.82502555847168, -29.220333099365234, -27.61564064025879, -26.010948181152344, -24.406253814697266, -22.801563262939453, -21.196868896484375, -19.59217643737793, -17.987483978271484, -16.38279151916504, -14.778099060058594, -13.173405647277832, -11.568713188171387, -9.964020729064941, -8.35932731628418, -6.754634857177734, -5.149942398071289, -3.5452497005462646, -1.9405570030212402, -0.3358640670776367, 1.2688283920288086, 2.873520851135254, 4.478214263916016, 6.082906723022461, 7.687602996826172, 9.292295455932617, 10.896987915039062, 12.501681327819824, 14.10637378692627, 15.711066246032715, 17.315759658813477, 18.920452117919922, 20.525144577026367, 22.129837036132812, 23.734529495239258, 25.339221954345703, 26.94391632080078, 28.548606872558594, 30.153301239013672, 31.757993698120117, 33.36268615722656, 34.96738052368164, 36.57207107543945, 38.17676544189453, 39.781455993652344, 41.38615036010742, 42.9908447265625, 44.59553527832031, 46.200225830078125, 47.8049201965332, 49.409610748291016, 51.014305114746094, 52.618995666503906, 54.223690032958984, 55.82838439941406, 57.433074951171875, 59.03776931762695]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 14.0, 14.0, 14.0, 21.0, 63.0, 447.0, 51462376.0, 120.0, 20.0, 14.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3986.817138671875, -3800.021240234375, -3613.225341796875, -3426.4296875, -3239.6337890625, -3052.837890625, -2866.0419921875, -2679.24609375, -2492.4501953125, -2305.654296875, -2118.8583984375, -1932.0626220703125, -1745.2667236328125, -1558.4708251953125, -1371.675048828125, -1184.879150390625, -998.083251953125, -811.287353515625, -624.4915161132812, -437.6956787109375, -250.8997802734375, -64.1038818359375, 122.69189453125, 309.48779296875, 496.28369140625, 683.07958984375, 869.8754272460938, 1056.6712646484375, 1243.4671630859375, 1430.2630615234375, 1617.058837890625, 1803.854736328125, 1990.650390625, 2177.4462890625, 2364.2421875, 2551.0380859375, 2737.833984375, 2924.6298828125, 3111.425537109375, 3298.221435546875, 3485.017333984375, 3671.813232421875, 3858.609130859375, 4045.40478515625, 4232.20068359375, 4418.99658203125, 4605.79248046875, 4792.58837890625, 4979.38427734375, 5166.18017578125, 5352.97607421875, 5539.77197265625, 5726.56787109375, 5913.36376953125, 6100.1591796875, 6286.955078125, 6473.7509765625, 6660.546875, 6847.3427734375, 7034.138671875, 7220.9345703125, 7407.73046875, 7594.5263671875, 7781.322265625, 7968.1181640625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 9.0, 13.0, 27.0, 37.0, 49.0, 70.0, 100.0, 133.0, 213.0, 350.0, 514.0, 769.0, 1206.0, 1771.0, 2622.0, 3765.0, 5422.0, 8543.0, 12433.0, 18256.0, 27801.0, 41151.0, 60176.0, 89086.0, 129959.0, 185002.0, 254876.0, 332189.0, 1713375.0, 2200863.0, 338229.0, 260509.0, 188864.0, 131972.0, 91061.0, 61354.0, 42275.0, 28225.0, 19191.0, 12790.0, 8643.0, 5723.0, 3904.0, 2545.0, 1769.0, 1220.0, 815.0, 558.0, 354.0, 225.0, 157.0, 90.0, 70.0, 46.0, 36.0, 15.0, 11.0, 6.0, 4.0, 2.0, 2.0], "bins": [-1.7490234375, -1.6944122314453125, -1.639801025390625, -1.5851898193359375, -1.53057861328125, -1.4759674072265625, -1.421356201171875, -1.3667449951171875, -1.3121337890625, -1.2575225830078125, -1.202911376953125, -1.1483001708984375, -1.09368896484375, -1.0390777587890625, -0.984466552734375, -0.9298553466796875, -0.875244140625, -0.8206329345703125, -0.766021728515625, -0.7114105224609375, -0.65679931640625, -0.6021881103515625, -0.547576904296875, -0.4929656982421875, -0.4383544921875, -0.3837432861328125, -0.329132080078125, -0.2745208740234375, -0.21990966796875, -0.1652984619140625, -0.110687255859375, -0.0560760498046875, -0.00146484375, 0.0531463623046875, 0.107757568359375, 0.1623687744140625, 0.21697998046875, 0.2715911865234375, 0.326202392578125, 0.3808135986328125, 0.4354248046875, 0.4900360107421875, 0.544647216796875, 0.5992584228515625, 0.65386962890625, 0.7084808349609375, 0.763092041015625, 0.8177032470703125, 0.872314453125, 0.9269256591796875, 0.981536865234375, 1.0361480712890625, 1.09075927734375, 1.1453704833984375, 1.199981689453125, 1.2545928955078125, 1.3092041015625, 1.3638153076171875, 1.418426513671875, 1.4730377197265625, 1.52764892578125, 1.5822601318359375, 1.636871337890625, 1.6914825439453125, 1.74609375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 6.0, 17.0, 16.0, 17.0, 16.0, 24.0, 20.0, 27.0, 33.0, 35.0, 32.0, 28.0, 40.0, 46.0, 50.0, 70.0, 836.0, 231.0, 36.0, 35.0, 39.0, 40.0, 37.0, 31.0, 36.0, 27.0, 25.0, 31.0, 19.0, 11.0, 13.0, 19.0, 11.0, 8.0, 9.0, 9.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2247314453125, -14.676025390625, -14.1273193359375, -13.57861328125, -13.0299072265625, -12.481201171875, -11.9324951171875, -11.3837890625, -10.8350830078125, -10.286376953125, -9.7376708984375, -9.18896484375, -8.6402587890625, -8.091552734375, -7.5428466796875, -6.994140625, -6.4454345703125, -5.896728515625, -5.3480224609375, -4.79931640625, -4.2506103515625, -3.701904296875, -3.1531982421875, -2.6044921875, -2.0557861328125, -1.507080078125, -0.9583740234375, -0.40966796875, 0.1390380859375, 0.687744140625, 1.2364501953125, 1.78515625, 2.3338623046875, 2.882568359375, 3.4312744140625, 3.97998046875, 4.5286865234375, 5.077392578125, 5.6260986328125, 6.1748046875, 6.7235107421875, 7.272216796875, 7.8209228515625, 8.36962890625, 8.9183349609375, 9.467041015625, 10.0157470703125, 10.564453125, 11.1131591796875, 11.661865234375, 12.2105712890625, 12.75927734375, 13.3079833984375, 13.856689453125, 14.4053955078125, 14.9541015625, 15.5028076171875, 16.051513671875, 16.6002197265625, 17.14892578125, 17.6976318359375, 18.246337890625, 18.7950439453125, 19.34375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 12.0, 6.0, 12.0, 22.0, 29.0, 51.0, 78.0, 114.0, 185.0, 254.0, 424.0, 682.0, 989.0, 1596.0, 2346.0, 3884.0, 6258.0, 9752.0, 15404.0, 24459.0, 40082.0, 63522.0, 101047.0, 159392.0, 238721.0, 339788.0, 600532.0, 3405163.0, 412485.0, 300125.0, 204884.0, 134118.0, 84283.0, 52967.0, 32496.0, 20471.0, 12875.0, 7941.0, 5065.0, 3166.0, 1998.0, 1298.0, 838.0, 571.0, 355.0, 250.0, 153.0, 95.0, 70.0, 48.0, 32.0, 18.0, 16.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.9287109375, -1.8650665283203125, -1.801422119140625, -1.7377777099609375, -1.67413330078125, -1.6104888916015625, -1.546844482421875, -1.4832000732421875, -1.4195556640625, -1.3559112548828125, -1.292266845703125, -1.2286224365234375, -1.16497802734375, -1.1013336181640625, -1.037689208984375, -0.9740447998046875, -0.910400390625, -0.8467559814453125, -0.783111572265625, -0.7194671630859375, -0.65582275390625, -0.5921783447265625, -0.528533935546875, -0.4648895263671875, -0.4012451171875, -0.3376007080078125, -0.273956298828125, -0.2103118896484375, -0.14666748046875, -0.0830230712890625, -0.019378662109375, 0.0442657470703125, 0.10791015625, 0.1715545654296875, 0.235198974609375, 0.2988433837890625, 0.36248779296875, 0.4261322021484375, 0.489776611328125, 0.5534210205078125, 0.6170654296875, 0.6807098388671875, 0.744354248046875, 0.8079986572265625, 0.87164306640625, 0.9352874755859375, 0.998931884765625, 1.0625762939453125, 1.126220703125, 1.1898651123046875, 1.253509521484375, 1.3171539306640625, 1.38079833984375, 1.4444427490234375, 1.508087158203125, 1.5717315673828125, 1.6353759765625, 1.6990203857421875, 1.762664794921875, 1.8263092041015625, 1.88995361328125, 1.9535980224609375, 2.017242431640625, 2.0808868408203125, 2.14453125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 9.0, 10.0, 6.0, 12.0, 15.0, 12.0, 25.0, 15.0, 28.0, 20.0, 20.0, 36.0, 31.0, 37.0, 33.0, 33.0, 34.0, 42.0, 68.0, 738.0, 314.0, 40.0, 34.0, 48.0, 35.0, 44.0, 30.0, 30.0, 23.0, 22.0, 18.0, 23.0, 22.0, 14.0, 14.0, 12.0, 10.0, 15.0, 13.0, 5.0, 8.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.7734375, -12.384521484375, -11.99560546875, -11.606689453125, -11.2177734375, -10.828857421875, -10.43994140625, -10.051025390625, -9.662109375, -9.273193359375, -8.88427734375, -8.495361328125, -8.1064453125, -7.717529296875, -7.32861328125, -6.939697265625, -6.55078125, -6.161865234375, -5.77294921875, -5.384033203125, -4.9951171875, -4.606201171875, -4.21728515625, -3.828369140625, -3.439453125, -3.050537109375, -2.66162109375, -2.272705078125, -1.8837890625, -1.494873046875, -1.10595703125, -0.717041015625, -0.328125, 0.060791015625, 0.44970703125, 0.838623046875, 1.2275390625, 1.616455078125, 2.00537109375, 2.394287109375, 2.783203125, 3.172119140625, 3.56103515625, 3.949951171875, 4.3388671875, 4.727783203125, 5.11669921875, 5.505615234375, 5.89453125, 6.283447265625, 6.67236328125, 7.061279296875, 7.4501953125, 7.839111328125, 8.22802734375, 8.616943359375, 9.005859375, 9.394775390625, 9.78369140625, 10.172607421875, 10.5615234375, 10.950439453125, 11.33935546875, 11.728271484375, 12.1171875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 10.0, 8.0, 17.0, 19.0, 13.0, 44.0, 72.0, 102.0, 132.0, 147.0, 232.0, 363.0, 550.0, 820.0, 1268.0, 2252.0, 3857.0, 7165.0, 14495.0, 31165.0, 71220.0, 198695.0, 5734360.0, 125225.0, 51279.0, 23007.0, 10842.0, 5729.0, 3179.0, 1928.0, 1016.0, 715.0, 465.0, 282.0, 189.0, 145.0, 98.0, 86.0, 60.0, 38.0, 31.0, 22.0, 21.0, 6.0, 9.0, 12.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.484375, -8.21337890625, -7.9423828125, -7.67138671875, -7.400390625, -7.12939453125, -6.8583984375, -6.58740234375, -6.31640625, -6.04541015625, -5.7744140625, -5.50341796875, -5.232421875, -4.96142578125, -4.6904296875, -4.41943359375, -4.1484375, -3.87744140625, -3.6064453125, -3.33544921875, -3.064453125, -2.79345703125, -2.5224609375, -2.25146484375, -1.98046875, -1.70947265625, -1.4384765625, -1.16748046875, -0.896484375, -0.62548828125, -0.3544921875, -0.08349609375, 0.1875, 0.45849609375, 0.7294921875, 1.00048828125, 1.271484375, 1.54248046875, 1.8134765625, 2.08447265625, 2.35546875, 2.62646484375, 2.8974609375, 3.16845703125, 3.439453125, 3.71044921875, 3.9814453125, 4.25244140625, 4.5234375, 4.79443359375, 5.0654296875, 5.33642578125, 5.607421875, 5.87841796875, 6.1494140625, 6.42041015625, 6.69140625, 6.96240234375, 7.2333984375, 7.50439453125, 7.775390625, 8.04638671875, 8.3173828125, 8.58837890625, 8.859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 10.0, 13.0, 13.0, 9.0, 16.0, 20.0, 22.0, 24.0, 26.0, 26.0, 36.0, 36.0, 33.0, 30.0, 38.0, 49.0, 225.0, 786.0, 130.0, 61.0, 47.0, 34.0, 33.0, 37.0, 28.0, 27.0, 23.0, 26.0, 28.0, 26.0, 16.0, 10.0, 9.0, 12.0, 8.0, 11.0, 10.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-12.546875, -12.1827392578125, -11.818603515625, -11.4544677734375, -11.09033203125, -10.7261962890625, -10.362060546875, -9.9979248046875, -9.6337890625, -9.2696533203125, -8.905517578125, -8.5413818359375, -8.17724609375, -7.8131103515625, -7.448974609375, -7.0848388671875, -6.720703125, -6.3565673828125, -5.992431640625, -5.6282958984375, -5.26416015625, -4.9000244140625, -4.535888671875, -4.1717529296875, -3.8076171875, -3.4434814453125, -3.079345703125, -2.7152099609375, -2.35107421875, -1.9869384765625, -1.622802734375, -1.2586669921875, -0.89453125, -0.5303955078125, -0.166259765625, 0.1978759765625, 0.56201171875, 0.9261474609375, 1.290283203125, 1.6544189453125, 2.0185546875, 2.3826904296875, 2.746826171875, 3.1109619140625, 3.47509765625, 3.8392333984375, 4.203369140625, 4.5675048828125, 4.931640625, 5.2957763671875, 5.659912109375, 6.0240478515625, 6.38818359375, 6.7523193359375, 7.116455078125, 7.4805908203125, 7.8447265625, 8.2088623046875, 8.572998046875, 8.9371337890625, 9.30126953125, 9.6654052734375, 10.029541015625, 10.3936767578125, 10.7578125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 8.0, 11.0, 14.0, 16.0, 29.0, 33.0, 66.0, 72.0, 94.0, 133.0, 130.0, 132.0, 77.0, 48.0, 35.0, 28.0, 17.0, 18.0, 8.0, 3.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.085384368896484, -23.286029815673828, -22.486675262451172, -21.68732261657715, -20.887968063354492, -20.088613510131836, -19.289260864257812, -18.489906311035156, -17.6905517578125, -16.891197204589844, -16.091842651367188, -15.292490005493164, -14.493135452270508, -13.693780899047852, -12.894427299499512, -12.095073699951172, -11.295719146728516, -10.49636459350586, -9.69701099395752, -8.89765739440918, -8.098302841186523, -7.298948764801025, -6.499594688415527, -5.700240612030029, -4.900886535644531, -4.101532459259033, -3.302178382873535, -2.502824306488037, -1.703470230102539, -0.904116153717041, -0.10476207733154297, 0.6945919990539551, 1.4939441680908203, 2.2932982444763184, 3.0926523208618164, 3.8920063972473145, 4.6913604736328125, 5.4907145500183105, 6.290068626403809, 7.089422702789307, 7.888776779174805, 8.688131332397461, 9.4874849319458, 10.28683853149414, 11.086193084716797, 11.885547637939453, 12.684901237487793, 13.484254837036133, 14.283609390258789, 15.082963943481445, 15.882317543029785, 16.681671142578125, 17.48102569580078, 18.280380249023438, 19.079734802246094, 19.879087448120117, 20.678442001342773, 21.47779655456543, 22.277149200439453, 23.07650375366211, 23.875858306884766, 24.675212860107422, 25.474567413330078, 26.2739200592041, 27.073274612426758]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 9.0, 26.0, 16.0, 21.0, 29.0, 50.0, 61.0, 57.0, 74.0, 94.0, 96.0, 92.0, 91.0, 64.0, 51.0, 34.0, 31.0, 29.0, 22.0, 10.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.219627380371094, -43.7860107421875, -42.35239791870117, -40.91878128051758, -39.48516845703125, -38.051551818847656, -36.61793518066406, -35.18431854248047, -33.75070571899414, -32.31708908081055, -30.88347625732422, -29.449859619140625, -28.016244888305664, -26.582630157470703, -25.14901351928711, -23.71539878845215, -22.281784057617188, -20.848169326782227, -19.414554595947266, -17.980937957763672, -16.54732322692871, -15.11370849609375, -13.680092811584473, -12.246477127075195, -10.812862396240234, -9.379247665405273, -7.945631980895996, -6.512016773223877, -5.078401565551758, -3.6447863578796387, -2.2111711502075195, -0.7775554656982422, 0.6560592651367188, 2.089674472808838, 3.523289680480957, 4.956904888153076, 6.390520095825195, 7.8241353034973145, 9.257750511169434, 10.691366195678711, 12.124980926513672, 13.558595657348633, 14.99221134185791, 16.425827026367188, 17.85944175720215, 19.29305648803711, 20.726673126220703, 22.160287857055664, 23.593902587890625, 25.027517318725586, 26.461132049560547, 27.89474868774414, 29.3283634185791, 30.761978149414062, 32.195594787597656, 33.62921142578125, 35.06282424926758, 36.49644088745117, 37.9300537109375, 39.363670349121094, 40.79728698730469, 42.230899810791016, 43.66451644897461, 45.09812927246094, 46.53174591064453]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 5.0, 16.0, 20.0, 14.0, 39.0, 34.0, 52.0, 81.0, 101.0, 159.0, 212.0, 313.0, 457.0, 775.0, 1185.0, 2053.0, 3938.0, 8291.0, 22207.0, 103419.0, 3934269.0, 77218.0, 20115.0, 8370.0, 4210.0, 2318.0, 1406.0, 899.0, 578.0, 440.0, 276.0, 207.0, 154.0, 119.0, 83.0, 67.0, 33.0, 46.0, 16.0, 14.0, 15.0, 12.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.025390625, -0.9937820434570312, -0.9621734619140625, -0.9305648803710938, -0.898956298828125, -0.8673477172851562, -0.8357391357421875, -0.8041305541992188, -0.77252197265625, -0.7409133911132812, -0.7093048095703125, -0.6776962280273438, -0.646087646484375, -0.6144790649414062, -0.5828704833984375, -0.5512619018554688, -0.5196533203125, -0.48804473876953125, -0.4564361572265625, -0.42482757568359375, -0.393218994140625, -0.36161041259765625, -0.3300018310546875, -0.29839324951171875, -0.26678466796875, -0.23517608642578125, -0.2035675048828125, -0.17195892333984375, -0.140350341796875, -0.10874176025390625, -0.0771331787109375, -0.04552459716796875, -0.013916015625, 0.01769256591796875, 0.0493011474609375, 0.08090972900390625, 0.112518310546875, 0.14412689208984375, 0.1757354736328125, 0.20734405517578125, 0.23895263671875, 0.27056121826171875, 0.3021697998046875, 0.33377838134765625, 0.365386962890625, 0.39699554443359375, 0.4286041259765625, 0.46021270751953125, 0.4918212890625, 0.5234298706054688, 0.5550384521484375, 0.5866470336914062, 0.618255615234375, 0.6498641967773438, 0.6814727783203125, 0.7130813598632812, 0.74468994140625, 0.7762985229492188, 0.8079071044921875, 0.8395156860351562, 0.871124267578125, 0.9027328491210938, 0.9343414306640625, 0.9659500122070312, 0.99755859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 4.0, 5.0, 8.0, 3.0, 6.0, 8.0, 16.0, 10.0, 12.0, 24.0, 134.0, 669.0, 16.0, 11.0, 10.0, 17.0, 8.0, 4.0, 4.0, 5.0, 1.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.29450225830078125, -0.2850494384765625, -0.27559661865234375, -0.266143798828125, -0.25669097900390625, -0.2472381591796875, -0.23778533935546875, -0.22833251953125, -0.21887969970703125, -0.2094268798828125, -0.19997406005859375, -0.190521240234375, -0.18106842041015625, -0.1716156005859375, -0.16216278076171875, -0.1527099609375, -0.14325714111328125, -0.1338043212890625, -0.12435150146484375, -0.114898681640625, -0.10544586181640625, -0.0959930419921875, -0.08654022216796875, -0.07708740234375, -0.06763458251953125, -0.0581817626953125, -0.04872894287109375, -0.039276123046875, -0.02982330322265625, -0.0203704833984375, -0.01091766357421875, -0.00146484375, 0.00798797607421875, 0.0174407958984375, 0.02689361572265625, 0.036346435546875, 0.04579925537109375, 0.0552520751953125, 0.06470489501953125, 0.07415771484375, 0.08361053466796875, 0.0930633544921875, 0.10251617431640625, 0.111968994140625, 0.12142181396484375, 0.1308746337890625, 0.14032745361328125, 0.1497802734375, 0.15923309326171875, 0.1686859130859375, 0.17813873291015625, 0.187591552734375, 0.19704437255859375, 0.2064971923828125, 0.21595001220703125, 0.22540283203125, 0.23485565185546875, 0.2443084716796875, 0.25376129150390625, 0.263214111328125, 0.27266693115234375, 0.2821197509765625, 0.29157257080078125, 0.301025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 6.0, 7.0, 17.0, 28.0, 26.0, 59.0, 80.0, 133.0, 205.0, 333.0, 535.0, 807.0, 1414.0, 2539.0, 4896.0, 10233.0, 26102.0, 82879.0, 489448.0, 3179223.0, 298901.0, 60327.0, 19506.0, 7983.0, 3735.0, 2017.0, 1141.0, 648.0, 388.0, 241.0, 136.0, 98.0, 64.0, 48.0, 23.0, 18.0, 12.0, 9.0, 7.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7017669677734375, -0.679412841796875, -0.6570587158203125, -0.63470458984375, -0.6123504638671875, -0.589996337890625, -0.5676422119140625, -0.5452880859375, -0.5229339599609375, -0.500579833984375, -0.4782257080078125, -0.45587158203125, -0.4335174560546875, -0.411163330078125, -0.3888092041015625, -0.366455078125, -0.3441009521484375, -0.321746826171875, -0.2993927001953125, -0.27703857421875, -0.2546844482421875, -0.232330322265625, -0.2099761962890625, -0.1876220703125, -0.1652679443359375, -0.142913818359375, -0.1205596923828125, -0.09820556640625, -0.0758514404296875, -0.053497314453125, -0.0311431884765625, -0.0087890625, 0.0135650634765625, 0.035919189453125, 0.0582733154296875, 0.08062744140625, 0.1029815673828125, 0.125335693359375, 0.1476898193359375, 0.1700439453125, 0.1923980712890625, 0.214752197265625, 0.2371063232421875, 0.25946044921875, 0.2818145751953125, 0.304168701171875, 0.3265228271484375, 0.348876953125, 0.3712310791015625, 0.393585205078125, 0.4159393310546875, 0.43829345703125, 0.4606475830078125, 0.483001708984375, 0.5053558349609375, 0.5277099609375, 0.5500640869140625, 0.572418212890625, 0.5947723388671875, 0.61712646484375, 0.6394805908203125, 0.661834716796875, 0.6841888427734375, 0.70654296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 7.0, 11.0, 14.0, 26.0, 27.0, 38.0, 55.0, 63.0, 112.0, 220.0, 419.0, 1340.0, 935.0, 321.0, 170.0, 91.0, 61.0, 38.0, 29.0, 25.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.37078857421875, -0.3594970703125, -0.34820556640625, -0.3369140625, -0.32562255859375, -0.3143310546875, -0.30303955078125, -0.291748046875, -0.28045654296875, -0.2691650390625, -0.25787353515625, -0.24658203125, -0.23529052734375, -0.2239990234375, -0.21270751953125, -0.201416015625, -0.19012451171875, -0.1788330078125, -0.16754150390625, -0.15625, -0.14495849609375, -0.1336669921875, -0.12237548828125, -0.111083984375, -0.09979248046875, -0.0885009765625, -0.07720947265625, -0.06591796875, -0.05462646484375, -0.0433349609375, -0.03204345703125, -0.020751953125, -0.00946044921875, 0.0018310546875, 0.01312255859375, 0.0244140625, 0.03570556640625, 0.0469970703125, 0.05828857421875, 0.069580078125, 0.08087158203125, 0.0921630859375, 0.10345458984375, 0.11474609375, 0.12603759765625, 0.1373291015625, 0.14862060546875, 0.159912109375, 0.17120361328125, 0.1824951171875, 0.19378662109375, 0.205078125, 0.21636962890625, 0.2276611328125, 0.23895263671875, 0.250244140625, 0.26153564453125, 0.2728271484375, 0.28411865234375, 0.29541015625, 0.30670166015625, 0.3179931640625, 0.32928466796875, 0.340576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 15.0, 40.0, 61.0, 139.0, 183.0, 221.0, 131.0, 92.0, 53.0, 29.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9518307447433472, -1.8877747058868408, -1.8237186670303345, -1.7596626281738281, -1.6956065893173218, -1.6315505504608154, -1.5674943923950195, -1.5034384727478027, -1.4393823146820068, -1.3753262758255005, -1.3112702369689941, -1.2472141981124878, -1.1831581592559814, -1.119102120399475, -1.0550460815429688, -0.9909899830818176, -0.926934003829956, -0.8628779649734497, -0.7988219261169434, -0.734765887260437, -0.6707098484039307, -0.6066538095474243, -0.5425977110862732, -0.47854167222976685, -0.4144856333732605, -0.35042959451675415, -0.2863735556602478, -0.22231748700141907, -0.15826144814491272, -0.09420540928840637, -0.030149340629577637, 0.03390669822692871, 0.09796285629272461, 0.16201889514923096, 0.2260749489068985, 0.29013100266456604, 0.3541870415210724, 0.41824308037757874, 0.48229914903640747, 0.5463551878929138, 0.6104112267494202, 0.6744672656059265, 0.7385233044624329, 0.802579402923584, 0.8666354417800903, 0.9306914806365967, 0.994747519493103, 1.0588035583496094, 1.1228595972061157, 1.186915636062622, 1.2509716749191284, 1.3150277137756348, 1.3790837526321411, 1.4431397914886475, 1.5071959495544434, 1.5712518692016602, 1.635308027267456, 1.6993640661239624, 1.7634201049804688, 1.827476143836975, 1.8915321826934814, 1.9555882215499878, 2.019644260406494, 2.08370041847229, 2.147756338119507]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 12.0, 11.0, 16.0, 22.0, 22.0, 34.0, 34.0, 47.0, 58.0, 55.0, 59.0, 75.0, 86.0, 71.0, 78.0, 61.0, 55.0, 49.0, 40.0, 29.0, 19.0, 12.0, 15.0, 17.0, 7.0, 5.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5357944965362549, -1.4858287572860718, -1.4358630180358887, -1.3858972787857056, -1.3359315395355225, -1.285965919494629, -1.2360001802444458, -1.1860344409942627, -1.1360687017440796, -1.0861029624938965, -1.0361372232437134, -0.986171543598175, -0.9362058043479919, -0.8862400650978088, -0.8362743854522705, -0.7863086462020874, -0.7363429069519043, -0.6863771677017212, -0.6364114284515381, -0.5864457488059998, -0.5364800095558167, -0.48651427030563354, -0.4365485608577728, -0.3865828514099121, -0.336617112159729, -0.2866513729095459, -0.23668566346168518, -0.18671993911266327, -0.13675421476364136, -0.08678849041461945, -0.036822766065597534, 0.013142943382263184, 0.06310880184173584, 0.11307452619075775, 0.16304025053977966, 0.21300597488880157, 0.2629716992378235, 0.3129374384880066, 0.3629031479358673, 0.412868857383728, 0.46283459663391113, 0.5128003358840942, 0.5627660751342773, 0.6127317547798157, 0.6626974940299988, 0.7126632332801819, 0.7626289129257202, 0.8125946521759033, 0.8625603914260864, 0.9125261306762695, 0.9624918699264526, 1.0124576091766357, 1.0624232292175293, 1.1123889684677124, 1.1623547077178955, 1.2123204469680786, 1.2622861862182617, 1.3122519254684448, 1.362217664718628, 1.412183403968811, 1.4621491432189941, 1.5121147632598877, 1.5620805025100708, 1.612046241760254, 1.662011981010437]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 7.0, 11.0, 16.0, 23.0, 36.0, 46.0, 66.0, 78.0, 132.0, 180.0, 279.0, 353.0, 531.0, 715.0, 1045.0, 1611.0, 2498.0, 3894.0, 6443.0, 11357.0, 22655.0, 94297.0, 818239.0, 42155.0, 17335.0, 9247.0, 5385.0, 3254.0, 2114.0, 1378.0, 983.0, 657.0, 462.0, 318.0, 230.0, 167.0, 112.0, 81.0, 50.0, 29.0, 22.0, 23.0, 15.0, 12.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9169921875, -0.8886184692382812, -0.8602447509765625, -0.8318710327148438, -0.803497314453125, -0.7751235961914062, -0.7467498779296875, -0.7183761596679688, -0.69000244140625, -0.6616287231445312, -0.6332550048828125, -0.6048812866210938, -0.576507568359375, -0.5481338500976562, -0.5197601318359375, -0.49138641357421875, -0.4630126953125, -0.43463897705078125, -0.4062652587890625, -0.37789154052734375, -0.349517822265625, -0.32114410400390625, -0.2927703857421875, -0.26439666748046875, -0.23602294921875, -0.20764923095703125, -0.1792755126953125, -0.15090179443359375, -0.122528076171875, -0.09415435791015625, -0.0657806396484375, -0.03740692138671875, -0.009033203125, 0.01934051513671875, 0.0477142333984375, 0.07608795166015625, 0.104461669921875, 0.13283538818359375, 0.1612091064453125, 0.18958282470703125, 0.21795654296875, 0.24633026123046875, 0.2747039794921875, 0.30307769775390625, 0.331451416015625, 0.35982513427734375, 0.3881988525390625, 0.41657257080078125, 0.4449462890625, 0.47332000732421875, 0.5016937255859375, 0.5300674438476562, 0.558441162109375, 0.5868148803710938, 0.6151885986328125, 0.6435623168945312, 0.67193603515625, 0.7003097534179688, 0.7286834716796875, 0.7570571899414062, 0.785430908203125, 0.8138046264648438, 0.8421783447265625, 0.8705520629882812, 0.89892578125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 3.0, 5.0, 5.0, 11.0, 9.0, 19.0, 20.0, 82.0, 405.0, 299.0, 45.0, 9.0, 10.0, 14.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.27338409423828125, -0.2645416259765625, -0.25569915771484375, -0.246856689453125, -0.23801422119140625, -0.2291717529296875, -0.22032928466796875, -0.21148681640625, -0.20264434814453125, -0.1938018798828125, -0.18495941162109375, -0.176116943359375, -0.16727447509765625, -0.1584320068359375, -0.14958953857421875, -0.1407470703125, -0.13190460205078125, -0.1230621337890625, -0.11421966552734375, -0.105377197265625, -0.09653472900390625, -0.0876922607421875, -0.07884979248046875, -0.07000732421875, -0.06116485595703125, -0.0523223876953125, -0.04347991943359375, -0.034637451171875, -0.02579498291015625, -0.0169525146484375, -0.00811004638671875, 0.000732421875, 0.00957489013671875, 0.0184173583984375, 0.02725982666015625, 0.036102294921875, 0.04494476318359375, 0.0537872314453125, 0.06262969970703125, 0.07147216796875, 0.08031463623046875, 0.0891571044921875, 0.09799957275390625, 0.106842041015625, 0.11568450927734375, 0.1245269775390625, 0.13336944580078125, 0.1422119140625, 0.15105438232421875, 0.1598968505859375, 0.16873931884765625, 0.177581787109375, 0.18642425537109375, 0.1952667236328125, 0.20410919189453125, 0.21295166015625, 0.22179412841796875, 0.2306365966796875, 0.23947906494140625, 0.248321533203125, 0.25716400146484375, 0.2660064697265625, 0.27484893798828125, 0.28369140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 11.0, 12.0, 19.0, 28.0, 29.0, 59.0, 78.0, 105.0, 127.0, 187.0, 257.0, 400.0, 629.0, 966.0, 1425.0, 2361.0, 4091.0, 6827.0, 12397.0, 22583.0, 43917.0, 90770.0, 208490.0, 333726.0, 164491.0, 73426.0, 36048.0, 19150.0, 10370.0, 5988.0, 3524.0, 2084.0, 1368.0, 827.0, 555.0, 378.0, 252.0, 177.0, 118.0, 73.0, 65.0, 38.0, 43.0, 22.0, 20.0, 11.0, 7.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.548828125, -0.5301361083984375, -0.511444091796875, -0.4927520751953125, -0.47406005859375, -0.4553680419921875, -0.436676025390625, -0.4179840087890625, -0.3992919921875, -0.3805999755859375, -0.361907958984375, -0.3432159423828125, -0.32452392578125, -0.3058319091796875, -0.287139892578125, -0.2684478759765625, -0.249755859375, -0.2310638427734375, -0.212371826171875, -0.1936798095703125, -0.17498779296875, -0.1562957763671875, -0.137603759765625, -0.1189117431640625, -0.1002197265625, -0.0815277099609375, -0.062835693359375, -0.0441436767578125, -0.02545166015625, -0.0067596435546875, 0.011932373046875, 0.0306243896484375, 0.04931640625, 0.0680084228515625, 0.086700439453125, 0.1053924560546875, 0.12408447265625, 0.1427764892578125, 0.161468505859375, 0.1801605224609375, 0.1988525390625, 0.2175445556640625, 0.236236572265625, 0.2549285888671875, 0.27362060546875, 0.2923126220703125, 0.311004638671875, 0.3296966552734375, 0.348388671875, 0.3670806884765625, 0.385772705078125, 0.4044647216796875, 0.42315673828125, 0.4418487548828125, 0.460540771484375, 0.4792327880859375, 0.4979248046875, 0.5166168212890625, 0.535308837890625, 0.5540008544921875, 0.57269287109375, 0.5913848876953125, 0.610076904296875, 0.6287689208984375, 0.6474609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 11.0, 16.0, 11.0, 9.0, 21.0, 22.0, 16.0, 25.0, 32.0, 35.0, 31.0, 32.0, 44.0, 34.0, 33.0, 44.0, 48.0, 46.0, 49.0, 48.0, 50.0, 36.0, 42.0, 36.0, 29.0, 28.0, 27.0, 22.0, 17.0, 13.0, 23.0, 11.0, 16.0, 10.0, 7.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.1455078125, -1.1130828857421875, -1.080657958984375, -1.0482330322265625, -1.01580810546875, -0.9833831787109375, -0.950958251953125, -0.9185333251953125, -0.8861083984375, -0.8536834716796875, -0.821258544921875, -0.7888336181640625, -0.75640869140625, -0.7239837646484375, -0.691558837890625, -0.6591339111328125, -0.626708984375, -0.5942840576171875, -0.561859130859375, -0.5294342041015625, -0.49700927734375, -0.4645843505859375, -0.432159423828125, -0.3997344970703125, -0.3673095703125, -0.3348846435546875, -0.302459716796875, -0.2700347900390625, -0.23760986328125, -0.2051849365234375, -0.172760009765625, -0.1403350830078125, -0.10791015625, -0.0754852294921875, -0.043060302734375, -0.0106353759765625, 0.02178955078125, 0.0542144775390625, 0.086639404296875, 0.1190643310546875, 0.1514892578125, 0.1839141845703125, 0.216339111328125, 0.2487640380859375, 0.28118896484375, 0.3136138916015625, 0.346038818359375, 0.3784637451171875, 0.410888671875, 0.4433135986328125, 0.475738525390625, 0.5081634521484375, 0.54058837890625, 0.5730133056640625, 0.605438232421875, 0.6378631591796875, 0.6702880859375, 0.7027130126953125, 0.735137939453125, 0.7675628662109375, 0.79998779296875, 0.8324127197265625, 0.864837646484375, 0.8972625732421875, 0.9296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 10.0, 17.0, 28.0, 37.0, 66.0, 146.0, 383.0, 1507.0, 13761.0, 969298.0, 59222.0, 3063.0, 583.0, 205.0, 93.0, 54.0, 31.0, 14.0, 15.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.400390625, -3.3023681640625, -3.204345703125, -3.1063232421875, -3.00830078125, -2.9102783203125, -2.812255859375, -2.7142333984375, -2.6162109375, -2.5181884765625, -2.420166015625, -2.3221435546875, -2.22412109375, -2.1260986328125, -2.028076171875, -1.9300537109375, -1.83203125, -1.7340087890625, -1.635986328125, -1.5379638671875, -1.43994140625, -1.3419189453125, -1.243896484375, -1.1458740234375, -1.0478515625, -0.9498291015625, -0.851806640625, -0.7537841796875, -0.65576171875, -0.5577392578125, -0.459716796875, -0.3616943359375, -0.263671875, -0.1656494140625, -0.067626953125, 0.0303955078125, 0.12841796875, 0.2264404296875, 0.324462890625, 0.4224853515625, 0.5205078125, 0.6185302734375, 0.716552734375, 0.8145751953125, 0.91259765625, 1.0106201171875, 1.108642578125, 1.2066650390625, 1.3046875, 1.4027099609375, 1.500732421875, 1.5987548828125, 1.69677734375, 1.7947998046875, 1.892822265625, 1.9908447265625, 2.0888671875, 2.1868896484375, 2.284912109375, 2.3829345703125, 2.48095703125, 2.5789794921875, 2.677001953125, 2.7750244140625, 2.873046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 23.0, 59.0, 101.0, 170.0, 211.0, 195.0, 90.0, 73.0, 28.0, 14.0, 9.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001780986785888672, -0.00017400365322828293, -0.00016990862786769867, -0.0001658136025071144, -0.00016171857714653015, -0.0001576235517859459, -0.00015352852642536163, -0.00014943350106477737, -0.00014533847570419312, -0.00014124345034360886, -0.0001371484249830246, -0.00013305339962244034, -0.00012895837426185608, -0.00012486334890127182, -0.00012076832354068756, -0.0001166732981801033, -0.00011257827281951904, -0.00010848324745893478, -0.00010438822209835052, -0.00010029319673776627, -9.619817137718201e-05, -9.210314601659775e-05, -8.800812065601349e-05, -8.391309529542923e-05, -7.981806993484497e-05, -7.572304457426071e-05, -7.162801921367645e-05, -6.75329938530922e-05, -6.343796849250793e-05, -5.9342943131923676e-05, -5.5247917771339417e-05, -5.115289241075516e-05, -4.70578670501709e-05, -4.296284168958664e-05, -3.886781632900238e-05, -3.477279096841812e-05, -3.067776560783386e-05, -2.6582740247249603e-05, -2.2487714886665344e-05, -1.8392689526081085e-05, -1.4297664165496826e-05, -1.0202638804912567e-05, -6.107613444328308e-06, -2.012588083744049e-06, 2.08243727684021e-06, 6.177462637424469e-06, 1.0272487998008728e-05, 1.4367513358592987e-05, 1.8462538719177246e-05, 2.2557564079761505e-05, 2.6652589440345764e-05, 3.074761480093002e-05, 3.484264016151428e-05, 3.893766552209854e-05, 4.30326908826828e-05, 4.712771624326706e-05, 5.122274160385132e-05, 5.531776696443558e-05, 5.9412792325019836e-05, 6.35078176856041e-05, 6.760284304618835e-05, 7.169786840677261e-05, 7.579289376735687e-05, 7.988791912794113e-05, 8.398294448852539e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 22.0, 25.0, 40.0, 51.0, 77.0, 118.0, 214.0, 340.0, 652.0, 1574.0, 3997.0, 14091.0, 81610.0, 685396.0, 221721.0, 27545.0, 6560.0, 2275.0, 990.0, 480.0, 299.0, 132.0, 120.0, 58.0, 48.0, 25.0, 22.0, 13.0, 7.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.987945556640625, -0.94952392578125, -0.911102294921875, -0.8726806640625, -0.834259033203125, -0.79583740234375, -0.757415771484375, -0.718994140625, -0.680572509765625, -0.64215087890625, -0.603729248046875, -0.5653076171875, -0.526885986328125, -0.48846435546875, -0.450042724609375, -0.41162109375, -0.373199462890625, -0.33477783203125, -0.296356201171875, -0.2579345703125, -0.219512939453125, -0.18109130859375, -0.142669677734375, -0.104248046875, -0.065826416015625, -0.02740478515625, 0.011016845703125, 0.0494384765625, 0.087860107421875, 0.12628173828125, 0.164703369140625, 0.203125, 0.241546630859375, 0.27996826171875, 0.318389892578125, 0.3568115234375, 0.395233154296875, 0.43365478515625, 0.472076416015625, 0.510498046875, 0.548919677734375, 0.58734130859375, 0.625762939453125, 0.6641845703125, 0.702606201171875, 0.74102783203125, 0.779449462890625, 0.81787109375, 0.856292724609375, 0.89471435546875, 0.933135986328125, 0.9715576171875, 1.009979248046875, 1.04840087890625, 1.086822509765625, 1.125244140625, 1.163665771484375, 1.20208740234375, 1.240509033203125, 1.2789306640625, 1.317352294921875, 1.35577392578125, 1.394195556640625, 1.4326171875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 9.0, 8.0, 11.0, 25.0, 40.0, 43.0, 91.0, 121.0, 121.0, 131.0, 131.0, 105.0, 68.0, 34.0, 21.0, 17.0, 9.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9443359375, -0.899139404296875, -0.85394287109375, -0.808746337890625, -0.7635498046875, -0.718353271484375, -0.67315673828125, -0.627960205078125, -0.582763671875, -0.537567138671875, -0.49237060546875, -0.447174072265625, -0.4019775390625, -0.356781005859375, -0.31158447265625, -0.266387939453125, -0.22119140625, -0.175994873046875, -0.13079833984375, -0.085601806640625, -0.0404052734375, 0.004791259765625, 0.04998779296875, 0.095184326171875, 0.140380859375, 0.185577392578125, 0.23077392578125, 0.275970458984375, 0.3211669921875, 0.366363525390625, 0.41156005859375, 0.456756591796875, 0.501953125, 0.547149658203125, 0.59234619140625, 0.637542724609375, 0.6827392578125, 0.727935791015625, 0.77313232421875, 0.818328857421875, 0.863525390625, 0.908721923828125, 0.95391845703125, 0.999114990234375, 1.0443115234375, 1.089508056640625, 1.13470458984375, 1.179901123046875, 1.22509765625, 1.270294189453125, 1.31549072265625, 1.360687255859375, 1.4058837890625, 1.451080322265625, 1.49627685546875, 1.541473388671875, 1.586669921875, 1.631866455078125, 1.67706298828125, 1.722259521484375, 1.7674560546875, 1.812652587890625, 1.85784912109375, 1.903045654296875, 1.9482421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 9.0, 14.0, 11.0, 28.0, 45.0, 91.0, 168.0, 233.0, 164.0, 81.0, 53.0, 38.0, 23.0, 14.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.532609939575195, -9.185256004333496, -8.837903022766113, -8.490549087524414, -8.143196105957031, -7.795842170715332, -7.448488235473633, -7.101134777069092, -6.753781318664551, -6.40642786026001, -6.059074401855469, -5.7117204666137695, -5.3643670082092285, -5.0170135498046875, -4.669659614562988, -4.322306156158447, -3.9749526977539062, -3.6275992393493652, -3.280245542526245, -2.932891845703125, -2.585538387298584, -2.238184928894043, -1.8908312320709229, -1.5434775352478027, -1.1961240768432617, -0.8487704992294312, -0.5014169216156006, -0.15406334400177002, 0.19329023361206055, 0.5406438112258911, 0.8879973888397217, 1.2353510856628418, 1.5827054977416992, 1.9300590753555298, 2.2774126529693604, 2.6247663497924805, 2.9721198081970215, 3.3194732666015625, 3.6668269634246826, 4.014180660247803, 4.361534118652344, 4.708887577056885, 5.056241035461426, 5.403594970703125, 5.750948429107666, 6.098301887512207, 6.445655822753906, 6.793009281158447, 7.140362739562988, 7.487716197967529, 7.83506965637207, 8.18242359161377, 8.529777526855469, 8.877130508422852, 9.22448444366455, 9.57183837890625, 9.919191360473633, 10.266545295715332, 10.613898277282715, 10.961252212524414, 11.308605194091797, 11.655959129333496, 12.003313064575195, 12.350666046142578, 12.698019981384277]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 9.0, 3.0, 8.0, 15.0, 15.0, 13.0, 39.0, 62.0, 106.0, 130.0, 167.0, 140.0, 99.0, 59.0, 30.0, 28.0, 14.0, 10.0, 6.0, 6.0, 5.0, 6.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.883638381958008, -21.227081298828125, -20.57052230834961, -19.913965225219727, -19.257408142089844, -18.600849151611328, -17.944292068481445, -17.287734985351562, -16.631175994873047, -15.974617958068848, -15.318059921264648, -14.661502838134766, -14.004944801330566, -13.348386764526367, -12.691829681396484, -12.035271644592285, -11.378713607788086, -10.722155570983887, -10.065597534179688, -9.409040451049805, -8.752482414245605, -8.095924377441406, -7.439366817474365, -6.782809257507324, -6.126251220703125, -5.469693183898926, -4.813135623931885, -4.156578063964844, -3.5000200271606445, -2.8434622287750244, -2.1869044303894043, -1.5303468704223633, -0.8737907409667969, -0.21723294258117676, 0.43932485580444336, 1.0958826541900635, 1.7524404525756836, 2.4089982509613037, 3.065556049346924, 3.722113609313965, 4.378671646118164, 5.035229682922363, 5.691787242889404, 6.348344802856445, 7.0049028396606445, 7.661460876464844, 8.318017959594727, 8.974575996398926, 9.631134033203125, 10.287692070007324, 10.944250106811523, 11.600807189941406, 12.257365226745605, 12.913923263549805, 13.570480346679688, 14.227038383483887, 14.883596420288086, 15.540154457092285, 16.196712493896484, 16.853269577026367, 17.50982666015625, 18.166385650634766, 18.82294273376465, 19.47949981689453, 20.136058807373047]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 4.0, 13.0, 16.0, 25.0, 20.0, 33.0, 52.0, 76.0, 104.0, 125.0, 195.0, 255.0, 351.0, 457.0, 609.0, 907.0, 1297.0, 1928.0, 3221.0, 5923.0, 13002.0, 38951.0, 468225.0, 3567649.0, 57537.0, 15798.0, 6954.0, 3611.0, 2226.0, 1443.0, 963.0, 677.0, 466.0, 344.0, 234.0, 151.0, 121.0, 76.0, 73.0, 43.0, 33.0, 24.0, 17.0, 18.0, 13.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.412109375, -2.33929443359375, -2.2664794921875, -2.19366455078125, -2.120849609375, -2.04803466796875, -1.9752197265625, -1.90240478515625, -1.82958984375, -1.75677490234375, -1.6839599609375, -1.61114501953125, -1.538330078125, -1.46551513671875, -1.3927001953125, -1.31988525390625, -1.2470703125, -1.17425537109375, -1.1014404296875, -1.02862548828125, -0.955810546875, -0.88299560546875, -0.8101806640625, -0.73736572265625, -0.66455078125, -0.59173583984375, -0.5189208984375, -0.44610595703125, -0.373291015625, -0.30047607421875, -0.2276611328125, -0.15484619140625, -0.08203125, -0.00921630859375, 0.0635986328125, 0.13641357421875, 0.209228515625, 0.28204345703125, 0.3548583984375, 0.42767333984375, 0.50048828125, 0.57330322265625, 0.6461181640625, 0.71893310546875, 0.791748046875, 0.86456298828125, 0.9373779296875, 1.01019287109375, 1.0830078125, 1.15582275390625, 1.2286376953125, 1.30145263671875, 1.374267578125, 1.44708251953125, 1.5198974609375, 1.59271240234375, 1.66552734375, 1.73834228515625, 1.8111572265625, 1.88397216796875, 1.956787109375, 2.02960205078125, 2.1024169921875, 2.17523193359375, 2.248046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 12.0, 13.0, 18.0, 10.0, 27.0, 54.0, 96.0, 164.0, 219.0, 134.0, 79.0, 27.0, 21.0, 11.0, 10.0, 12.0, 5.0, 7.0, 6.0, 5.0, 8.0, 5.0, 8.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21610069274902344, -0.20917892456054688, -0.2022571563720703, -0.19533538818359375, -0.1884136199951172, -0.18149185180664062, -0.17457008361816406, -0.1676483154296875, -0.16072654724121094, -0.15380477905273438, -0.1468830108642578, -0.13996124267578125, -0.1330394744873047, -0.12611770629882812, -0.11919593811035156, -0.112274169921875, -0.10535240173339844, -0.09843063354492188, -0.09150886535644531, -0.08458709716796875, -0.07766532897949219, -0.07074356079101562, -0.06382179260253906, -0.0569000244140625, -0.04997825622558594, -0.043056488037109375, -0.03613471984863281, -0.02921295166015625, -0.022291183471679688, -0.015369415283203125, -0.008447647094726562, -0.00152587890625, 0.0053958892822265625, 0.012317657470703125, 0.019239425659179688, 0.02616119384765625, 0.03308296203613281, 0.040004730224609375, 0.04692649841308594, 0.0538482666015625, 0.06077003479003906, 0.06769180297851562, 0.07461357116699219, 0.08153533935546875, 0.08845710754394531, 0.09537887573242188, 0.10230064392089844, 0.109222412109375, 0.11614418029785156, 0.12306594848632812, 0.1299877166748047, 0.13690948486328125, 0.1438312530517578, 0.15075302124023438, 0.15767478942871094, 0.1645965576171875, 0.17151832580566406, 0.17844009399414062, 0.1853618621826172, 0.19228363037109375, 0.1992053985595703, 0.20612716674804688, 0.21304893493652344, 0.219970703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 11.0, 15.0, 23.0, 21.0, 22.0, 43.0, 58.0, 76.0, 129.0, 162.0, 221.0, 385.0, 575.0, 813.0, 1251.0, 1941.0, 3234.0, 5487.0, 10211.0, 21073.0, 55148.0, 263442.0, 3427296.0, 299124.0, 58122.0, 21331.0, 10090.0, 5411.0, 3054.0, 1941.0, 1097.0, 777.0, 505.0, 371.0, 232.0, 161.0, 108.0, 81.0, 75.0, 42.0, 22.0, 25.0, 19.0, 17.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.494140625, -1.4481964111328125, -1.402252197265625, -1.3563079833984375, -1.31036376953125, -1.2644195556640625, -1.218475341796875, -1.1725311279296875, -1.1265869140625, -1.0806427001953125, -1.034698486328125, -0.9887542724609375, -0.94281005859375, -0.8968658447265625, -0.850921630859375, -0.8049774169921875, -0.759033203125, -0.7130889892578125, -0.667144775390625, -0.6212005615234375, -0.57525634765625, -0.5293121337890625, -0.483367919921875, -0.4374237060546875, -0.3914794921875, -0.3455352783203125, -0.299591064453125, -0.2536468505859375, -0.20770263671875, -0.1617584228515625, -0.115814208984375, -0.0698699951171875, -0.02392578125, 0.0220184326171875, 0.067962646484375, 0.1139068603515625, 0.15985107421875, 0.2057952880859375, 0.251739501953125, 0.2976837158203125, 0.3436279296875, 0.3895721435546875, 0.435516357421875, 0.4814605712890625, 0.52740478515625, 0.5733489990234375, 0.619293212890625, 0.6652374267578125, 0.711181640625, 0.7571258544921875, 0.803070068359375, 0.8490142822265625, 0.89495849609375, 0.9409027099609375, 0.986846923828125, 1.0327911376953125, 1.0787353515625, 1.1246795654296875, 1.170623779296875, 1.2165679931640625, 1.26251220703125, 1.3084564208984375, 1.354400634765625, 1.4003448486328125, 1.4462890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 8.0, 2.0, 7.0, 12.0, 7.0, 12.0, 15.0, 10.0, 20.0, 25.0, 36.0, 43.0, 82.0, 178.0, 573.0, 2012.0, 483.0, 214.0, 124.0, 62.0, 40.0, 18.0, 17.0, 9.0, 15.0, 8.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.453125, -0.4409942626953125, -0.428863525390625, -0.4167327880859375, -0.40460205078125, -0.3924713134765625, -0.380340576171875, -0.3682098388671875, -0.3560791015625, -0.3439483642578125, -0.331817626953125, -0.3196868896484375, -0.30755615234375, -0.2954254150390625, -0.283294677734375, -0.2711639404296875, -0.259033203125, -0.2469024658203125, -0.234771728515625, -0.2226409912109375, -0.21051025390625, -0.1983795166015625, -0.186248779296875, -0.1741180419921875, -0.1619873046875, -0.1498565673828125, -0.137725830078125, -0.1255950927734375, -0.11346435546875, -0.1013336181640625, -0.089202880859375, -0.0770721435546875, -0.06494140625, -0.0528106689453125, -0.040679931640625, -0.0285491943359375, -0.01641845703125, -0.0042877197265625, 0.007843017578125, 0.0199737548828125, 0.0321044921875, 0.0442352294921875, 0.056365966796875, 0.0684967041015625, 0.08062744140625, 0.0927581787109375, 0.104888916015625, 0.1170196533203125, 0.129150390625, 0.1412811279296875, 0.153411865234375, 0.1655426025390625, 0.17767333984375, 0.1898040771484375, 0.201934814453125, 0.2140655517578125, 0.2261962890625, 0.2383270263671875, 0.250457763671875, 0.2625885009765625, 0.27471923828125, 0.2868499755859375, 0.298980712890625, 0.3111114501953125, 0.3232421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 39.0, 93.0, 370.0, 316.0, 83.0, 40.0, 19.0, 15.0, 4.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7284982204437256, -1.5678640604019165, -1.4072299003601074, -1.2465956211090088, -1.0859615802764893, -0.9253273606300354, -0.7646931409835815, -0.6040589809417725, -0.4434248208999634, -0.2827906608581543, -0.12215647101402283, 0.03847771883010864, 0.19911187887191772, 0.3597460389137268, 0.5203802585601807, 0.6810144186019897, 0.8416485786437988, 1.002282738685608, 1.162916898727417, 1.3235511779785156, 1.4841852188110352, 1.6448194980621338, 1.8054536581039429, 1.966087818145752, 2.1267218589782715, 2.28735613822937, 2.4479901790618896, 2.6086244583129883, 2.769258499145508, 2.9298927783966064, 3.090527057647705, 3.2511610984802246, 3.411795139312744, 3.5724294185638428, 3.7330634593963623, 3.893697738647461, 4.0543317794799805, 4.2149658203125, 4.375600337982178, 4.536234378814697, 4.696868419647217, 4.857502460479736, 5.018136978149414, 5.178771018981934, 5.339405059814453, 5.500039100646973, 5.66067361831665, 5.82130765914917, 5.981942176818848, 6.142576217651367, 6.303210735321045, 6.4638447761535645, 6.624478816986084, 6.7851128578186035, 6.945747375488281, 7.106381416320801, 7.26701545715332, 7.42764949798584, 7.588284015655518, 7.748918056488037, 7.909552097320557, 8.070186614990234, 8.230820655822754, 8.391454696655273, 8.552088737487793]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 13.0, 24.0, 38.0, 44.0, 49.0, 72.0, 95.0, 82.0, 94.0, 85.0, 80.0, 74.0, 61.0, 37.0, 32.0, 26.0, 15.0, 21.0, 10.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.585054874420166, -2.4972848892211914, -2.409514904022217, -2.321744918823242, -2.2339749336242676, -2.146204948425293, -2.0584349632263184, -1.9706652164459229, -1.8828952312469482, -1.7951252460479736, -1.707355260848999, -1.6195852756500244, -1.5318154096603394, -1.4440454244613647, -1.3562754392623901, -1.268505573272705, -1.180735468864441, -1.0929654836654663, -1.0051954984664917, -0.9174255728721619, -0.829655647277832, -0.7418856620788574, -0.6541156768798828, -0.566345751285553, -0.47857576608657837, -0.39080581068992615, -0.3030358552932739, -0.21526587009429932, -0.1274959146976471, -0.03972595930099487, 0.048044025897979736, 0.13581395149230957, 0.22358393669128418, 0.3113538920879364, 0.3991238474845886, 0.48689383268356323, 0.5746637582778931, 0.6624337434768677, 0.7502037286758423, 0.8379736542701721, 0.9257436394691467, 1.0135135650634766, 1.1012835502624512, 1.1890535354614258, 1.2768235206604004, 1.364593505859375, 1.4523634910583496, 1.5401333570480347, 1.6279033422470093, 1.7156733274459839, 1.8034433126449585, 1.8912131786346436, 1.9789831638336182, 2.0667531490325928, 2.1545231342315674, 2.242293119430542, 2.3300631046295166, 2.417833089828491, 2.505603075027466, 2.5933730602264404, 2.681143045425415, 2.7689127922058105, 2.856682777404785, 2.9444527626037598, 3.0322227478027344]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 27.0, 30.0, 45.0, 55.0, 88.0, 117.0, 166.0, 246.0, 351.0, 487.0, 761.0, 1073.0, 1659.0, 2739.0, 4374.0, 7843.0, 14667.0, 33647.0, 117876.0, 547799.0, 221257.0, 49483.0, 19535.0, 9669.0, 5390.0, 3179.0, 1980.0, 1326.0, 812.0, 548.0, 353.0, 281.0, 181.0, 150.0, 94.0, 66.0, 50.0, 28.0, 31.0, 20.0, 13.0, 8.0, 7.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0673828125, -1.03369140625, -1.0, -0.96630859375, -0.9326171875, -0.89892578125, -0.865234375, -0.83154296875, -0.7978515625, -0.76416015625, -0.73046875, -0.69677734375, -0.6630859375, -0.62939453125, -0.595703125, -0.56201171875, -0.5283203125, -0.49462890625, -0.4609375, -0.42724609375, -0.3935546875, -0.35986328125, -0.326171875, -0.29248046875, -0.2587890625, -0.22509765625, -0.19140625, -0.15771484375, -0.1240234375, -0.09033203125, -0.056640625, -0.02294921875, 0.0107421875, 0.04443359375, 0.078125, 0.11181640625, 0.1455078125, 0.17919921875, 0.212890625, 0.24658203125, 0.2802734375, 0.31396484375, 0.34765625, 0.38134765625, 0.4150390625, 0.44873046875, 0.482421875, 0.51611328125, 0.5498046875, 0.58349609375, 0.6171875, 0.65087890625, 0.6845703125, 0.71826171875, 0.751953125, 0.78564453125, 0.8193359375, 0.85302734375, 0.88671875, 0.92041015625, 0.9541015625, 0.98779296875, 1.021484375, 1.05517578125, 1.0888671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 3.0, 5.0, 4.0, 15.0, 13.0, 13.0, 37.0, 43.0, 68.0, 94.0, 113.0, 126.0, 126.0, 80.0, 65.0, 43.0, 22.0, 22.0, 14.0, 9.0, 8.0, 12.0, 4.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.1686725616455078, -0.16315078735351562, -0.15762901306152344, -0.15210723876953125, -0.14658546447753906, -0.14106369018554688, -0.1355419158935547, -0.1300201416015625, -0.12449836730957031, -0.11897659301757812, -0.11345481872558594, -0.10793304443359375, -0.10241127014160156, -0.09688949584960938, -0.09136772155761719, -0.085845947265625, -0.08032417297363281, -0.07480239868164062, -0.06928062438964844, -0.06375885009765625, -0.05823707580566406, -0.052715301513671875, -0.04719352722167969, -0.0416717529296875, -0.03614997863769531, -0.030628204345703125, -0.025106430053710938, -0.01958465576171875, -0.014062881469726562, -0.008541107177734375, -0.0030193328857421875, 0.00250244140625, 0.008024215698242188, 0.013545989990234375, 0.019067764282226562, 0.02458953857421875, 0.030111312866210938, 0.035633087158203125, 0.04115486145019531, 0.0466766357421875, 0.05219841003417969, 0.057720184326171875, 0.06324195861816406, 0.06876373291015625, 0.07428550720214844, 0.07980728149414062, 0.08532905578613281, 0.090850830078125, 0.09637260437011719, 0.10189437866210938, 0.10741615295410156, 0.11293792724609375, 0.11845970153808594, 0.12398147583007812, 0.1295032501220703, 0.1350250244140625, 0.1405467987060547, 0.14606857299804688, 0.15159034729003906, 0.15711212158203125, 0.16263389587402344, 0.16815567016601562, 0.1736774444580078, 0.17919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 17.0, 28.0, 92.0, 193.0, 558.0, 1912.0, 8475.0, 48539.0, 393786.0, 518268.0, 62780.0, 10759.0, 2206.0, 599.0, 169.0, 89.0, 25.0, 10.0, 11.0, 8.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.44921875, -2.3910064697265625, -2.332794189453125, -2.2745819091796875, -2.21636962890625, -2.1581573486328125, -2.099945068359375, -2.0417327880859375, -1.9835205078125, -1.9253082275390625, -1.867095947265625, -1.8088836669921875, -1.75067138671875, -1.6924591064453125, -1.634246826171875, -1.5760345458984375, -1.517822265625, -1.4596099853515625, -1.401397705078125, -1.3431854248046875, -1.28497314453125, -1.2267608642578125, -1.168548583984375, -1.1103363037109375, -1.0521240234375, -0.9939117431640625, -0.935699462890625, -0.8774871826171875, -0.81927490234375, -0.7610626220703125, -0.702850341796875, -0.6446380615234375, -0.58642578125, -0.5282135009765625, -0.470001220703125, -0.4117889404296875, -0.35357666015625, -0.2953643798828125, -0.237152099609375, -0.1789398193359375, -0.1207275390625, -0.0625152587890625, -0.004302978515625, 0.0539093017578125, 0.11212158203125, 0.1703338623046875, 0.228546142578125, 0.2867584228515625, 0.344970703125, 0.4031829833984375, 0.461395263671875, 0.5196075439453125, 0.57781982421875, 0.6360321044921875, 0.694244384765625, 0.7524566650390625, 0.8106689453125, 0.8688812255859375, 0.927093505859375, 0.9853057861328125, 1.04351806640625, 1.1017303466796875, 1.159942626953125, 1.2181549072265625, 1.2763671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 4.0, 12.0, 10.0, 13.0, 15.0, 14.0, 25.0, 26.0, 28.0, 23.0, 37.0, 25.0, 43.0, 45.0, 44.0, 43.0, 45.0, 37.0, 32.0, 45.0, 52.0, 47.0, 39.0, 36.0, 39.0, 30.0, 24.0, 29.0, 17.0, 20.0, 18.0, 19.0, 6.0, 14.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7307281494140625, -0.708526611328125, -0.6863250732421875, -0.66412353515625, -0.6419219970703125, -0.619720458984375, -0.5975189208984375, -0.5753173828125, -0.5531158447265625, -0.530914306640625, -0.5087127685546875, -0.48651123046875, -0.4643096923828125, -0.442108154296875, -0.4199066162109375, -0.397705078125, -0.3755035400390625, -0.353302001953125, -0.3311004638671875, -0.30889892578125, -0.2866973876953125, -0.264495849609375, -0.2422943115234375, -0.2200927734375, -0.1978912353515625, -0.175689697265625, -0.1534881591796875, -0.13128662109375, -0.1090850830078125, -0.086883544921875, -0.0646820068359375, -0.04248046875, -0.0202789306640625, 0.001922607421875, 0.0241241455078125, 0.04632568359375, 0.0685272216796875, 0.090728759765625, 0.1129302978515625, 0.1351318359375, 0.1573333740234375, 0.179534912109375, 0.2017364501953125, 0.22393798828125, 0.2461395263671875, 0.268341064453125, 0.2905426025390625, 0.312744140625, 0.3349456787109375, 0.357147216796875, 0.3793487548828125, 0.40155029296875, 0.4237518310546875, 0.445953369140625, 0.4681549072265625, 0.4903564453125, 0.5125579833984375, 0.534759521484375, 0.5569610595703125, 0.57916259765625, 0.6013641357421875, 0.623565673828125, 0.6457672119140625, 0.66796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 21.0, 94.0, 569.0, 36103.0, 1009069.0, 2391.0, 212.0, 44.0, 17.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8502197265625, -7.598876953125, -7.3475341796875, -7.09619140625, -6.8448486328125, -6.593505859375, -6.3421630859375, -6.0908203125, -5.8394775390625, -5.588134765625, -5.3367919921875, -5.08544921875, -4.8341064453125, -4.582763671875, -4.3314208984375, -4.080078125, -3.8287353515625, -3.577392578125, -3.3260498046875, -3.07470703125, -2.8233642578125, -2.572021484375, -2.3206787109375, -2.0693359375, -1.8179931640625, -1.566650390625, -1.3153076171875, -1.06396484375, -0.8126220703125, -0.561279296875, -0.3099365234375, -0.05859375, 0.1927490234375, 0.444091796875, 0.6954345703125, 0.94677734375, 1.1981201171875, 1.449462890625, 1.7008056640625, 1.9521484375, 2.2034912109375, 2.454833984375, 2.7061767578125, 2.95751953125, 3.2088623046875, 3.460205078125, 3.7115478515625, 3.962890625, 4.2142333984375, 4.465576171875, 4.7169189453125, 4.96826171875, 5.2196044921875, 5.470947265625, 5.7222900390625, 5.9736328125, 6.2249755859375, 6.476318359375, 6.7276611328125, 6.97900390625, 7.2303466796875, 7.481689453125, 7.7330322265625, 7.984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 7.0, 9.0, 9.0, 17.0, 38.0, 49.0, 71.0, 103.0, 134.0, 114.0, 111.0, 98.0, 64.0, 59.0, 38.0, 19.0, 13.0, 12.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010782480239868164, -0.00010478310286998749, -0.00010174140334129333, -9.869970381259918e-05, -9.565800428390503e-05, -9.261630475521088e-05, -8.957460522651672e-05, -8.653290569782257e-05, -8.349120616912842e-05, -8.044950664043427e-05, -7.740780711174011e-05, -7.436610758304596e-05, -7.13244080543518e-05, -6.828270852565765e-05, -6.52410089969635e-05, -6.219930946826935e-05, -5.9157609939575195e-05, -5.611591041088104e-05, -5.307421088218689e-05, -5.003251135349274e-05, -4.6990811824798584e-05, -4.394911229610443e-05, -4.090741276741028e-05, -3.7865713238716125e-05, -3.482401371002197e-05, -3.178231418132782e-05, -2.8740614652633667e-05, -2.5698915123939514e-05, -2.265721559524536e-05, -1.961551606655121e-05, -1.6573816537857056e-05, -1.3532117009162903e-05, -1.049041748046875e-05, -7.448717951774597e-06, -4.407018423080444e-06, -1.3653188943862915e-06, 1.6763806343078613e-06, 4.718080163002014e-06, 7.759779691696167e-06, 1.080147922039032e-05, 1.3843178749084473e-05, 1.6884878277778625e-05, 1.992657780647278e-05, 2.296827733516693e-05, 2.6009976863861084e-05, 2.9051676392555237e-05, 3.209337592124939e-05, 3.513507544994354e-05, 3.8176774978637695e-05, 4.121847450733185e-05, 4.4260174036026e-05, 4.7301873564720154e-05, 5.034357309341431e-05, 5.338527262210846e-05, 5.642697215080261e-05, 5.9468671679496765e-05, 6.251037120819092e-05, 6.555207073688507e-05, 6.859377026557922e-05, 7.163546979427338e-05, 7.467716932296753e-05, 7.771886885166168e-05, 8.076056838035583e-05, 8.380226790904999e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 9.0, 16.0, 38.0, 45.0, 62.0, 105.0, 198.0, 353.0, 675.0, 1488.0, 3448.0, 10119.0, 40093.0, 223842.0, 584376.0, 141574.0, 28359.0, 7979.0, 2989.0, 1319.0, 648.0, 313.0, 164.0, 122.0, 83.0, 46.0, 22.0, 14.0, 13.0, 13.0, 7.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86962890625, -0.8389816284179688, -0.8083343505859375, -0.7776870727539062, -0.747039794921875, -0.7163925170898438, -0.6857452392578125, -0.6550979614257812, -0.62445068359375, -0.5938034057617188, -0.5631561279296875, -0.5325088500976562, -0.501861572265625, -0.47121429443359375, -0.4405670166015625, -0.40991973876953125, -0.3792724609375, -0.34862518310546875, -0.3179779052734375, -0.28733062744140625, -0.256683349609375, -0.22603607177734375, -0.1953887939453125, -0.16474151611328125, -0.13409423828125, -0.10344696044921875, -0.0727996826171875, -0.04215240478515625, -0.011505126953125, 0.01914215087890625, 0.0497894287109375, 0.08043670654296875, 0.111083984375, 0.14173126220703125, 0.1723785400390625, 0.20302581787109375, 0.233673095703125, 0.26432037353515625, 0.2949676513671875, 0.32561492919921875, 0.35626220703125, 0.38690948486328125, 0.4175567626953125, 0.44820404052734375, 0.478851318359375, 0.5094985961914062, 0.5401458740234375, 0.5707931518554688, 0.6014404296875, 0.6320877075195312, 0.6627349853515625, 0.6933822631835938, 0.724029541015625, 0.7546768188476562, 0.7853240966796875, 0.8159713745117188, 0.84661865234375, 0.8772659301757812, 0.9079132080078125, 0.9385604858398438, 0.969207763671875, 0.9998550415039062, 1.0305023193359375, 1.0611495971679688, 1.091796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 14.0, 10.0, 15.0, 18.0, 37.0, 55.0, 55.0, 57.0, 95.0, 108.0, 114.0, 107.0, 77.0, 66.0, 42.0, 31.0, 28.0, 19.0, 16.0, 12.0, 6.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6923828125, -0.6668853759765625, -0.641387939453125, -0.6158905029296875, -0.59039306640625, -0.5648956298828125, -0.539398193359375, -0.5139007568359375, -0.4884033203125, -0.4629058837890625, -0.437408447265625, -0.4119110107421875, -0.38641357421875, -0.3609161376953125, -0.335418701171875, -0.3099212646484375, -0.284423828125, -0.2589263916015625, -0.233428955078125, -0.2079315185546875, -0.18243408203125, -0.1569366455078125, -0.131439208984375, -0.1059417724609375, -0.0804443359375, -0.0549468994140625, -0.029449462890625, -0.0039520263671875, 0.02154541015625, 0.0470428466796875, 0.072540283203125, 0.0980377197265625, 0.12353515625, 0.1490325927734375, 0.174530029296875, 0.2000274658203125, 0.22552490234375, 0.2510223388671875, 0.276519775390625, 0.3020172119140625, 0.3275146484375, 0.3530120849609375, 0.378509521484375, 0.4040069580078125, 0.42950439453125, 0.4550018310546875, 0.480499267578125, 0.5059967041015625, 0.531494140625, 0.5569915771484375, 0.582489013671875, 0.6079864501953125, 0.63348388671875, 0.6589813232421875, 0.684478759765625, 0.7099761962890625, 0.7354736328125, 0.7609710693359375, 0.786468505859375, 0.8119659423828125, 0.83746337890625, 0.8629608154296875, 0.888458251953125, 0.9139556884765625, 0.939453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 7.0, 7.0, 34.0, 78.0, 232.0, 359.0, 174.0, 63.0, 24.0, 9.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.288938522338867, -12.865629196166992, -12.442319869995117, -12.019010543823242, -11.595702171325684, -11.172392845153809, -10.749083518981934, -10.325774192810059, -9.902464866638184, -9.479155540466309, -9.055846214294434, -8.632537841796875, -8.209228515625, -7.785919189453125, -7.36260986328125, -6.939300537109375, -6.515991687774658, -6.092682361602783, -5.669373512268066, -5.246064186096191, -4.822754859924316, -4.399445533752441, -3.9761366844177246, -3.5528273582458496, -3.1295182704925537, -2.706209182739258, -2.282899856567383, -1.859590768814087, -1.4362815618515015, -1.012972354888916, -0.5896632671356201, -0.16635394096374512, 0.2569551467895508, 0.6802643537521362, 1.1035735607147217, 1.5268826484680176, 1.950191855430603, 2.3735010623931885, 2.7968101501464844, 3.2201194763183594, 3.6434285640716553, 4.066737651824951, 4.490046977996826, 4.913355827331543, 5.336665153503418, 5.759974479675293, 6.183283805847168, 6.606593132019043, 7.02990198135376, 7.453211307525635, 7.876520156860352, 8.299829483032227, 8.723138809204102, 9.146448135375977, 9.569757461547852, 9.993066787719727, 10.416375160217285, 10.83968448638916, 11.262993812561035, 11.686302185058594, 12.109611511230469, 12.532920837402344, 12.956230163574219, 13.379539489746094, 13.802848815917969]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 1.0, 5.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 21.0, 31.0, 48.0, 63.0, 78.0, 99.0, 126.0, 96.0, 89.0, 80.0, 77.0, 43.0, 25.0, 18.0, 17.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.368463516235352, -11.058740615844727, -10.749017715454102, -10.43929386138916, -10.129570960998535, -9.81984806060791, -9.510124206542969, -9.200401306152344, -8.890678405761719, -8.580955505371094, -8.271232604980469, -7.961508750915527, -7.651785850524902, -7.342062950134277, -7.032339572906494, -6.722616195678711, -6.412893295288086, -6.103170394897461, -5.793447017669678, -5.4837236404418945, -5.1740007400512695, -4.8642778396606445, -4.554554462432861, -4.244831085205078, -3.935108184814453, -3.625385046005249, -3.315661907196045, -3.005938768386841, -2.6962156295776367, -2.3864924907684326, -2.0767693519592285, -1.7670462131500244, -1.4573240280151367, -1.1476008892059326, -0.8378777503967285, -0.5281546115875244, -0.2184314727783203, 0.09129166603088379, 0.4010148048400879, 0.710737943649292, 1.020461082458496, 1.3301842212677002, 1.6399073600769043, 1.9496304988861084, 2.2593536376953125, 2.5690767765045166, 2.8787999153137207, 3.188523054122925, 3.498246192932129, 3.807969331741333, 4.117692470550537, 4.42741584777832, 4.737138748168945, 5.04686164855957, 5.3565850257873535, 5.666308403015137, 5.976031303405762, 6.285754203796387, 6.59547758102417, 6.905200958251953, 7.214923858642578, 7.524646759033203, 7.834370136260986, 8.14409351348877, 8.453816413879395]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 15.0, 11.0, 26.0, 30.0, 56.0, 59.0, 89.0, 133.0, 226.0, 287.0, 509.0, 854.0, 1990.0, 4732.0, 18400.0, 533718.0, 3598484.0, 24700.0, 5617.0, 2055.0, 945.0, 476.0, 295.0, 190.0, 108.0, 85.0, 51.0, 38.0, 27.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6171875, -6.43377685546875, -6.2503662109375, -6.06695556640625, -5.883544921875, -5.70013427734375, -5.5167236328125, -5.33331298828125, -5.14990234375, -4.96649169921875, -4.7830810546875, -4.59967041015625, -4.416259765625, -4.23284912109375, -4.0494384765625, -3.86602783203125, -3.6826171875, -3.49920654296875, -3.3157958984375, -3.13238525390625, -2.948974609375, -2.76556396484375, -2.5821533203125, -2.39874267578125, -2.21533203125, -2.03192138671875, -1.8485107421875, -1.66510009765625, -1.481689453125, -1.29827880859375, -1.1148681640625, -0.93145751953125, -0.748046875, -0.56463623046875, -0.3812255859375, -0.19781494140625, -0.014404296875, 0.16900634765625, 0.3524169921875, 0.53582763671875, 0.71923828125, 0.90264892578125, 1.0860595703125, 1.26947021484375, 1.452880859375, 1.63629150390625, 1.8197021484375, 2.00311279296875, 2.1865234375, 2.36993408203125, 2.5533447265625, 2.73675537109375, 2.920166015625, 3.10357666015625, 3.2869873046875, 3.47039794921875, 3.65380859375, 3.83721923828125, 4.0206298828125, 4.20404052734375, 4.387451171875, 4.57086181640625, 4.7542724609375, 4.93768310546875, 5.12109375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 6.0, 9.0, 12.0, 18.0, 20.0, 29.0, 59.0, 76.0, 107.0, 118.0, 121.0, 106.0, 102.0, 57.0, 45.0, 18.0, 24.0, 8.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.2125415802001953, -0.20572280883789062, -0.19890403747558594, -0.19208526611328125, -0.18526649475097656, -0.17844772338867188, -0.1716289520263672, -0.1648101806640625, -0.1579914093017578, -0.15117263793945312, -0.14435386657714844, -0.13753509521484375, -0.13071632385253906, -0.12389755249023438, -0.11707878112792969, -0.110260009765625, -0.10344123840332031, -0.09662246704101562, -0.08980369567871094, -0.08298492431640625, -0.07616615295410156, -0.06934738159179688, -0.06252861022949219, -0.0557098388671875, -0.04889106750488281, -0.042072296142578125, -0.03525352478027344, -0.02843475341796875, -0.021615982055664062, -0.014797210693359375, -0.007978439331054688, -0.00115966796875, 0.0056591033935546875, 0.012477874755859375, 0.019296646118164062, 0.02611541748046875, 0.03293418884277344, 0.039752960205078125, 0.04657173156738281, 0.0533905029296875, 0.06020927429199219, 0.06702804565429688, 0.07384681701660156, 0.08066558837890625, 0.08748435974121094, 0.09430313110351562, 0.10112190246582031, 0.107940673828125, 0.11475944519042969, 0.12157821655273438, 0.12839698791503906, 0.13521575927734375, 0.14203453063964844, 0.14885330200195312, 0.1556720733642578, 0.1624908447265625, 0.1693096160888672, 0.17612838745117188, 0.18294715881347656, 0.18976593017578125, 0.19658470153808594, 0.20340347290039062, 0.2102222442626953, 0.217041015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 6.0, 19.0, 19.0, 31.0, 31.0, 59.0, 78.0, 158.0, 789.0, 333734.0, 3857683.0, 1167.0, 195.0, 89.0, 68.0, 45.0, 33.0, 19.0, 11.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.541015625, -11.97265625, -11.404296875, -10.8359375, -10.267578125, -9.69921875, -9.130859375, -8.5625, -7.994140625, -7.42578125, -6.857421875, -6.2890625, -5.720703125, -5.15234375, -4.583984375, -4.015625, -3.447265625, -2.87890625, -2.310546875, -1.7421875, -1.173828125, -0.60546875, -0.037109375, 0.53125, 1.099609375, 1.66796875, 2.236328125, 2.8046875, 3.373046875, 3.94140625, 4.509765625, 5.078125, 5.646484375, 6.21484375, 6.783203125, 7.3515625, 7.919921875, 8.48828125, 9.056640625, 9.625, 10.193359375, 10.76171875, 11.330078125, 11.8984375, 12.466796875, 13.03515625, 13.603515625, 14.171875, 14.740234375, 15.30859375, 15.876953125, 16.4453125, 17.013671875, 17.58203125, 18.150390625, 18.71875, 19.287109375, 19.85546875, 20.423828125, 20.9921875, 21.560546875, 22.12890625, 22.697265625, 23.265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 18.0, 7.0, 18.0, 24.0, 32.0, 51.0, 83.0, 129.0, 219.0, 441.0, 1678.0, 713.0, 257.0, 124.0, 75.0, 52.0, 42.0, 32.0, 25.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5732421875, -0.5584335327148438, -0.5436248779296875, -0.5288162231445312, -0.514007568359375, -0.49919891357421875, -0.4843902587890625, -0.46958160400390625, -0.45477294921875, -0.43996429443359375, -0.4251556396484375, -0.41034698486328125, -0.395538330078125, -0.38072967529296875, -0.3659210205078125, -0.35111236572265625, -0.3363037109375, -0.32149505615234375, -0.3066864013671875, -0.29187774658203125, -0.277069091796875, -0.26226043701171875, -0.2474517822265625, -0.23264312744140625, -0.21783447265625, -0.20302581787109375, -0.1882171630859375, -0.17340850830078125, -0.158599853515625, -0.14379119873046875, -0.1289825439453125, -0.11417388916015625, -0.099365234375, -0.08455657958984375, -0.0697479248046875, -0.05493927001953125, -0.040130615234375, -0.02532196044921875, -0.0105133056640625, 0.00429534912109375, 0.01910400390625, 0.03391265869140625, 0.0487213134765625, 0.06352996826171875, 0.078338623046875, 0.09314727783203125, 0.1079559326171875, 0.12276458740234375, 0.1375732421875, 0.15238189697265625, 0.1671905517578125, 0.18199920654296875, 0.196807861328125, 0.21161651611328125, 0.2264251708984375, 0.24123382568359375, 0.25604248046875, 0.27085113525390625, 0.2856597900390625, 0.30046844482421875, 0.315277099609375, 0.33008575439453125, 0.3448944091796875, 0.35970306396484375, 0.37451171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 15.0, 22.0, 19.0, 29.0, 62.0, 88.0, 173.0, 159.0, 143.0, 104.0, 68.0, 34.0, 24.0, 12.0, 10.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.378148317337036, -2.3036506175994873, -2.2291531562805176, -2.1546554565429688, -2.08015775680542, -2.00566029548645, -1.9311625957489014, -1.856665015220642, -1.7821674346923828, -1.7076698541641235, -1.6331722736358643, -1.5586745738983154, -1.4841769933700562, -1.4096794128417969, -1.335181713104248, -1.2606841325759888, -1.1861865520477295, -1.1116889715194702, -1.037191390991211, -0.9626936912536621, -0.8881961107254028, -0.8136985301971436, -0.7392008900642395, -0.6647032499313354, -0.5902056694030762, -0.5157080888748169, -0.44121044874191284, -0.3667128384113312, -0.2922152280807495, -0.21771761775016785, -0.14322000741958618, -0.06872236728668213, 0.005774974822998047, 0.08027258515357971, 0.15477019548416138, 0.22926780581474304, 0.3037654161453247, 0.37826302647590637, 0.45276063680648804, 0.5272582769393921, 0.6017558574676514, 0.6762534379959106, 0.7507510781288147, 0.8252487182617188, 0.899746298789978, 0.9742438793182373, 1.0487415790557861, 1.1232391595840454, 1.1977367401123047, 1.272234320640564, 1.3467319011688232, 1.421229600906372, 1.4957271814346313, 1.5702247619628906, 1.6447224617004395, 1.7192200422286987, 1.793717622756958, 1.8682152032852173, 1.9427127838134766, 2.0172104835510254, 2.091708183288574, 2.166205644607544, 2.2407033443450928, 2.3152008056640625, 2.3896985054016113]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 6.0, 12.0, 19.0, 22.0, 18.0, 26.0, 35.0, 41.0, 38.0, 48.0, 57.0, 67.0, 67.0, 52.0, 66.0, 65.0, 55.0, 51.0, 56.0, 47.0, 30.0, 19.0, 22.0, 16.0, 17.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7533705234527588, -1.6853567361831665, -1.6173430681228638, -1.5493292808532715, -1.4813156127929688, -1.4133018255233765, -1.3452880382537842, -1.2772743701934814, -1.2092607021331787, -1.1412469148635864, -1.0732332468032837, -1.0052194595336914, -0.9372057914733887, -0.8691920042037964, -0.8011782765388489, -0.7331645488739014, -0.6651507616043091, -0.5971370339393616, -0.5291233062744141, -0.46110954880714417, -0.39309582114219666, -0.32508209347724915, -0.25706833600997925, -0.18905460834503174, -0.12104088068008423, -0.05302714556455612, 0.014986589550971985, 0.08300033211708069, 0.1510140597820282, 0.2190277874469757, 0.2870415449142456, 0.3550552725791931, 0.4230690002441406, 0.49108272790908813, 0.5590964555740356, 0.6271102428436279, 0.6951239109039307, 0.763137698173523, 0.8311514258384705, 0.899165153503418, 0.9671788811683655, 1.035192608833313, 1.1032063961029053, 1.171220064163208, 1.2392338514328003, 1.307247519493103, 1.3752613067626953, 1.443274974822998, 1.5112887620925903, 1.5793025493621826, 1.6473162174224854, 1.7153300046920776, 1.7833436727523804, 1.8513574600219727, 1.9193711280822754, 1.9873849153518677, 2.05539870262146, 2.1234123706817627, 2.1914262771606445, 2.2594399452209473, 2.32745361328125, 2.3954672813415527, 2.4634811878204346, 2.5314948558807373, 2.59950852394104]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 10.0, 6.0, 10.0, 14.0, 20.0, 30.0, 41.0, 52.0, 82.0, 131.0, 186.0, 320.0, 461.0, 900.0, 1833.0, 4715.0, 16211.0, 99137.0, 705809.0, 183069.0, 24219.0, 6231.0, 2336.0, 1087.0, 611.0, 349.0, 218.0, 142.0, 107.0, 79.0, 41.0, 22.0, 24.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 0.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.478515625, -2.404815673828125, -2.33111572265625, -2.257415771484375, -2.1837158203125, -2.110015869140625, -2.03631591796875, -1.962615966796875, -1.888916015625, -1.815216064453125, -1.74151611328125, -1.667816162109375, -1.5941162109375, -1.520416259765625, -1.44671630859375, -1.373016357421875, -1.29931640625, -1.225616455078125, -1.15191650390625, -1.078216552734375, -1.0045166015625, -0.930816650390625, -0.85711669921875, -0.783416748046875, -0.709716796875, -0.636016845703125, -0.56231689453125, -0.488616943359375, -0.4149169921875, -0.341217041015625, -0.26751708984375, -0.193817138671875, -0.1201171875, -0.046417236328125, 0.02728271484375, 0.100982666015625, 0.1746826171875, 0.248382568359375, 0.32208251953125, 0.395782470703125, 0.469482421875, 0.543182373046875, 0.61688232421875, 0.690582275390625, 0.7642822265625, 0.837982177734375, 0.91168212890625, 0.985382080078125, 1.05908203125, 1.132781982421875, 1.20648193359375, 1.280181884765625, 1.3538818359375, 1.427581787109375, 1.50128173828125, 1.574981689453125, 1.648681640625, 1.722381591796875, 1.79608154296875, 1.869781494140625, 1.9434814453125, 2.017181396484375, 2.09088134765625, 2.164581298828125, 2.23828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 3.0, 6.0, 7.0, 14.0, 21.0, 35.0, 67.0, 69.0, 99.0, 116.0, 135.0, 114.0, 103.0, 69.0, 50.0, 26.0, 19.0, 18.0, 8.0, 7.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.210205078125, -0.20248031616210938, -0.19475555419921875, -0.18703079223632812, -0.1793060302734375, -0.17158126831054688, -0.16385650634765625, -0.15613174438476562, -0.148406982421875, -0.14068222045898438, -0.13295745849609375, -0.12523269653320312, -0.1175079345703125, -0.10978317260742188, -0.10205841064453125, -0.09433364868164062, -0.08660888671875, -0.07888412475585938, -0.07115936279296875, -0.06343460083007812, -0.0557098388671875, -0.047985076904296875, -0.04026031494140625, -0.032535552978515625, -0.024810791015625, -0.017086029052734375, -0.00936126708984375, -0.001636505126953125, 0.0060882568359375, 0.013813018798828125, 0.02153778076171875, 0.029262542724609375, 0.0369873046875, 0.044712066650390625, 0.05243682861328125, 0.060161590576171875, 0.0678863525390625, 0.07561111450195312, 0.08333587646484375, 0.09106063842773438, 0.098785400390625, 0.10651016235351562, 0.11423492431640625, 0.12195968627929688, 0.1296844482421875, 0.13740921020507812, 0.14513397216796875, 0.15285873413085938, 0.16058349609375, 0.16830825805664062, 0.17603302001953125, 0.18375778198242188, 0.1914825439453125, 0.19920730590820312, 0.20693206787109375, 0.21465682983398438, 0.222381591796875, 0.23010635375976562, 0.23783111572265625, 0.24555587768554688, 0.2532806396484375, 0.2610054016113281, 0.26873016357421875, 0.2764549255371094, 0.2841796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 27.0, 37.0, 54.0, 90.0, 110.0, 179.0, 247.0, 421.0, 605.0, 1013.0, 1685.0, 2929.0, 5146.0, 9695.0, 18800.0, 38538.0, 87884.0, 233314.0, 356271.0, 164350.0, 64836.0, 29671.0, 14534.0, 7522.0, 4219.0, 2426.0, 1386.0, 909.0, 567.0, 329.0, 205.0, 158.0, 105.0, 75.0, 51.0, 31.0, 23.0, 17.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.07421875, -1.0375823974609375, -1.000946044921875, -0.9643096923828125, -0.92767333984375, -0.8910369873046875, -0.854400634765625, -0.8177642822265625, -0.7811279296875, -0.7444915771484375, -0.707855224609375, -0.6712188720703125, -0.63458251953125, -0.5979461669921875, -0.561309814453125, -0.5246734619140625, -0.488037109375, -0.4514007568359375, -0.414764404296875, -0.3781280517578125, -0.34149169921875, -0.3048553466796875, -0.268218994140625, -0.2315826416015625, -0.1949462890625, -0.1583099365234375, -0.121673583984375, -0.0850372314453125, -0.04840087890625, -0.0117645263671875, 0.024871826171875, 0.0615081787109375, 0.09814453125, 0.1347808837890625, 0.171417236328125, 0.2080535888671875, 0.24468994140625, 0.2813262939453125, 0.317962646484375, 0.3545989990234375, 0.3912353515625, 0.4278717041015625, 0.464508056640625, 0.5011444091796875, 0.53778076171875, 0.5744171142578125, 0.611053466796875, 0.6476898193359375, 0.684326171875, 0.7209625244140625, 0.757598876953125, 0.7942352294921875, 0.83087158203125, 0.8675079345703125, 0.904144287109375, 0.9407806396484375, 0.9774169921875, 1.0140533447265625, 1.050689697265625, 1.0873260498046875, 1.12396240234375, 1.1605987548828125, 1.197235107421875, 1.2338714599609375, 1.2705078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 7.0, 8.0, 7.0, 8.0, 5.0, 17.0, 21.0, 22.0, 18.0, 24.0, 21.0, 37.0, 41.0, 25.0, 46.0, 46.0, 33.0, 41.0, 55.0, 60.0, 37.0, 53.0, 34.0, 35.0, 39.0, 32.0, 25.0, 28.0, 35.0, 29.0, 24.0, 14.0, 12.0, 16.0, 4.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.92138671875, -0.8895187377929688, -0.8576507568359375, -0.8257827758789062, -0.793914794921875, -0.7620468139648438, -0.7301788330078125, -0.6983108520507812, -0.66644287109375, -0.6345748901367188, -0.6027069091796875, -0.5708389282226562, -0.538970947265625, -0.5071029663085938, -0.4752349853515625, -0.44336700439453125, -0.4114990234375, -0.37963104248046875, -0.3477630615234375, -0.31589508056640625, -0.284027099609375, -0.25215911865234375, -0.2202911376953125, -0.18842315673828125, -0.15655517578125, -0.12468719482421875, -0.0928192138671875, -0.06095123291015625, -0.029083251953125, 0.00278472900390625, 0.0346527099609375, 0.06652069091796875, 0.098388671875, 0.13025665283203125, 0.1621246337890625, 0.19399261474609375, 0.225860595703125, 0.25772857666015625, 0.2895965576171875, 0.32146453857421875, 0.35333251953125, 0.38520050048828125, 0.4170684814453125, 0.44893646240234375, 0.480804443359375, 0.5126724243164062, 0.5445404052734375, 0.5764083862304688, 0.6082763671875, 0.6401443481445312, 0.6720123291015625, 0.7038803100585938, 0.735748291015625, 0.7676162719726562, 0.7994842529296875, 0.8313522338867188, 0.86322021484375, 0.8950881958007812, 0.9269561767578125, 0.9588241577148438, 0.990692138671875, 1.0225601196289062, 1.0544281005859375, 1.0862960815429688, 1.1181640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 6.0, 12.0, 13.0, 31.0, 36.0, 52.0, 67.0, 125.0, 199.0, 372.0, 735.0, 1617.0, 4382.0, 16346.0, 108219.0, 674712.0, 206463.0, 25172.0, 5849.0, 2118.0, 894.0, 437.0, 253.0, 148.0, 89.0, 63.0, 31.0, 32.0, 14.0, 18.0, 9.0, 8.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.459716796875, -1.41357421875, -1.367431640625, -1.3212890625, -1.275146484375, -1.22900390625, -1.182861328125, -1.13671875, -1.090576171875, -1.04443359375, -0.998291015625, -0.9521484375, -0.906005859375, -0.85986328125, -0.813720703125, -0.767578125, -0.721435546875, -0.67529296875, -0.629150390625, -0.5830078125, -0.536865234375, -0.49072265625, -0.444580078125, -0.3984375, -0.352294921875, -0.30615234375, -0.260009765625, -0.2138671875, -0.167724609375, -0.12158203125, -0.075439453125, -0.029296875, 0.016845703125, 0.06298828125, 0.109130859375, 0.1552734375, 0.201416015625, 0.24755859375, 0.293701171875, 0.33984375, 0.385986328125, 0.43212890625, 0.478271484375, 0.5244140625, 0.570556640625, 0.61669921875, 0.662841796875, 0.708984375, 0.755126953125, 0.80126953125, 0.847412109375, 0.8935546875, 0.939697265625, 0.98583984375, 1.031982421875, 1.078125, 1.124267578125, 1.17041015625, 1.216552734375, 1.2626953125, 1.308837890625, 1.35498046875, 1.401123046875, 1.447265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 13.0, 12.0, 24.0, 19.0, 34.0, 43.0, 51.0, 64.0, 67.0, 100.0, 110.0, 93.0, 71.0, 59.0, 46.0, 36.0, 31.0, 30.0, 20.0, 17.0, 15.0, 5.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013208389282226562, -0.00012873392552137375, -0.00012538395822048187, -0.00012203399091959, -0.00011868402361869812, -0.00011533405631780624, -0.00011198408901691437, -0.00010863412171602249, -0.00010528415441513062, -0.00010193418711423874, -9.858421981334686e-05, -9.523425251245499e-05, -9.188428521156311e-05, -8.853431791067123e-05, -8.518435060977936e-05, -8.183438330888748e-05, -7.84844160079956e-05, -7.513444870710373e-05, -7.178448140621185e-05, -6.843451410531998e-05, -6.50845468044281e-05, -6.173457950353622e-05, -5.838461220264435e-05, -5.503464490175247e-05, -5.1684677600860596e-05, -4.833471029996872e-05, -4.498474299907684e-05, -4.163477569818497e-05, -3.828480839729309e-05, -3.4934841096401215e-05, -3.158487379550934e-05, -2.8234906494617462e-05, -2.4884939193725586e-05, -2.153497189283371e-05, -1.8185004591941833e-05, -1.4835037291049957e-05, -1.1485069990158081e-05, -8.135102689266205e-06, -4.785135388374329e-06, -1.4351680874824524e-06, 1.914799213409424e-06, 5.2647665143013e-06, 8.614733815193176e-06, 1.1964701116085052e-05, 1.531466841697693e-05, 1.8664635717868805e-05, 2.201460301876068e-05, 2.5364570319652557e-05, 2.8714537620544434e-05, 3.206450492143631e-05, 3.5414472222328186e-05, 3.876443952322006e-05, 4.211440682411194e-05, 4.5464374125003815e-05, 4.881434142589569e-05, 5.216430872678757e-05, 5.551427602767944e-05, 5.886424332857132e-05, 6.22142106294632e-05, 6.556417793035507e-05, 6.891414523124695e-05, 7.226411253213882e-05, 7.56140798330307e-05, 7.896404713392258e-05, 8.231401443481445e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 10.0, 14.0, 24.0, 28.0, 63.0, 98.0, 195.0, 362.0, 912.0, 2739.0, 12808.0, 245221.0, 748810.0, 30382.0, 4399.0, 1324.0, 527.0, 268.0, 132.0, 96.0, 34.0, 26.0, 19.0, 18.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.504241943359375, -2.42645263671875, -2.348663330078125, -2.2708740234375, -2.193084716796875, -2.11529541015625, -2.037506103515625, -1.959716796875, -1.881927490234375, -1.80413818359375, -1.726348876953125, -1.6485595703125, -1.570770263671875, -1.49298095703125, -1.415191650390625, -1.33740234375, -1.259613037109375, -1.18182373046875, -1.104034423828125, -1.0262451171875, -0.948455810546875, -0.87066650390625, -0.792877197265625, -0.715087890625, -0.637298583984375, -0.55950927734375, -0.481719970703125, -0.4039306640625, -0.326141357421875, -0.24835205078125, -0.170562744140625, -0.0927734375, -0.014984130859375, 0.06280517578125, 0.140594482421875, 0.2183837890625, 0.296173095703125, 0.37396240234375, 0.451751708984375, 0.529541015625, 0.607330322265625, 0.68511962890625, 0.762908935546875, 0.8406982421875, 0.918487548828125, 0.99627685546875, 1.074066162109375, 1.15185546875, 1.229644775390625, 1.30743408203125, 1.385223388671875, 1.4630126953125, 1.540802001953125, 1.61859130859375, 1.696380615234375, 1.774169921875, 1.851959228515625, 1.92974853515625, 2.007537841796875, 2.0853271484375, 2.163116455078125, 2.24090576171875, 2.318695068359375, 2.396484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 11.0, 12.0, 27.0, 42.0, 49.0, 82.0, 102.0, 144.0, 141.0, 138.0, 76.0, 76.0, 44.0, 24.0, 13.0, 5.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6318359375, -0.6004791259765625, -0.569122314453125, -0.5377655029296875, -0.50640869140625, -0.4750518798828125, -0.443695068359375, -0.4123382568359375, -0.3809814453125, -0.3496246337890625, -0.318267822265625, -0.2869110107421875, -0.25555419921875, -0.2241973876953125, -0.192840576171875, -0.1614837646484375, -0.130126953125, -0.0987701416015625, -0.067413330078125, -0.0360565185546875, -0.00469970703125, 0.0266571044921875, 0.058013916015625, 0.0893707275390625, 0.1207275390625, 0.1520843505859375, 0.183441162109375, 0.2147979736328125, 0.24615478515625, 0.2775115966796875, 0.308868408203125, 0.3402252197265625, 0.37158203125, 0.4029388427734375, 0.434295654296875, 0.4656524658203125, 0.49700927734375, 0.5283660888671875, 0.559722900390625, 0.5910797119140625, 0.6224365234375, 0.6537933349609375, 0.685150146484375, 0.7165069580078125, 0.74786376953125, 0.7792205810546875, 0.810577392578125, 0.8419342041015625, 0.873291015625, 0.9046478271484375, 0.936004638671875, 0.9673614501953125, 0.99871826171875, 1.0300750732421875, 1.061431884765625, 1.0927886962890625, 1.1241455078125, 1.1555023193359375, 1.186859130859375, 1.2182159423828125, 1.24957275390625, 1.2809295654296875, 1.312286376953125, 1.3436431884765625, 1.375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 14.0, 25.0, 53.0, 83.0, 138.0, 201.0, 191.0, 122.0, 57.0, 30.0, 21.0, 13.0, 10.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.404948234558105, -10.979870796203613, -10.554794311523438, -10.129716873168945, -9.704639434814453, -9.279562950134277, -8.854485511779785, -8.42940902709961, -8.004331588745117, -7.579254627227783, -7.154177665710449, -6.729100227355957, -6.304023265838623, -5.878946304321289, -5.453868865966797, -5.028791904449463, -4.603714942932129, -4.178637981414795, -3.753560781478882, -3.3284835815429688, -2.9034066200256348, -2.478329658508301, -2.0532524585723877, -1.6281752586364746, -1.2030982971191406, -0.7780212163925171, -0.35294413566589355, 0.07213294506072998, 0.4972100257873535, 0.9222869873046875, 1.3473641872406006, 1.7724413871765137, 2.197519302368164, 2.622596263885498, 3.047673463821411, 3.472750663757324, 3.897827625274658, 4.322904586791992, 4.747982025146484, 5.173058986663818, 5.598135948181152, 6.023212909698486, 6.44828987121582, 6.8733673095703125, 7.2984442710876465, 7.7235212326049805, 8.148598670959473, 8.573675155639648, 8.99875259399414, 9.423830032348633, 9.848906517028809, 10.2739839553833, 10.699060440063477, 11.124137878417969, 11.549215316772461, 11.974292755126953, 12.399369239807129, 12.824446678161621, 13.249523162841797, 13.674600601196289, 14.099678039550781, 14.524754524230957, 14.94983196258545, 15.374908447265625, 15.799985885620117]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 15.0, 15.0, 25.0, 40.0, 37.0, 45.0, 85.0, 65.0, 84.0, 83.0, 81.0, 90.0, 82.0, 61.0, 43.0, 40.0, 19.0, 19.0, 14.0, 16.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.438114166259766, -13.978090286254883, -13.518067359924316, -13.058043479919434, -12.598020553588867, -12.137996673583984, -11.677972793579102, -11.217948913574219, -10.757925987243652, -10.29790210723877, -9.837879180908203, -9.37785530090332, -8.917831420898438, -8.457808494567871, -7.997784614562988, -7.537761211395264, -7.077737808227539, -6.6177144050598145, -6.15769100189209, -5.697667121887207, -5.237643718719482, -4.777620315551758, -4.317596435546875, -3.8575730323791504, -3.397549629211426, -2.937526226043701, -2.4775025844573975, -2.0174789428710938, -1.5574555397033691, -1.0974321365356445, -0.6374084949493408, -0.1773848533630371, 0.2826385498046875, 0.7426620721817017, 1.2026855945587158, 1.66270911693573, 2.122732639312744, 2.5827560424804688, 3.0427796840667725, 3.502803325653076, 3.962826728820801, 4.422850131988525, 4.88287353515625, 5.342897415161133, 5.802920818328857, 6.262944221496582, 6.722968101501465, 7.1829915046691895, 7.643014907836914, 8.103038787841797, 8.563061714172363, 9.023085594177246, 9.483108520507812, 9.943132400512695, 10.403156280517578, 10.863180160522461, 11.323203086853027, 11.78322696685791, 12.243249893188477, 12.70327377319336, 13.163297653198242, 13.623320579528809, 14.083344459533691, 14.543367385864258, 15.00339126586914]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 5.0, 16.0, 22.0, 39.0, 96.0, 187.0, 373.0, 1015.0, 4843.0, 242356.0, 3936734.0, 6964.0, 1058.0, 333.0, 124.0, 50.0, 27.0, 14.0, 9.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.786865234375, -21.18310546875, -20.579345703125, -19.9755859375, -19.371826171875, -18.76806640625, -18.164306640625, -17.560546875, -16.956787109375, -16.35302734375, -15.749267578125, -15.1455078125, -14.541748046875, -13.93798828125, -13.334228515625, -12.73046875, -12.126708984375, -11.52294921875, -10.919189453125, -10.3154296875, -9.711669921875, -9.10791015625, -8.504150390625, -7.900390625, -7.296630859375, -6.69287109375, -6.089111328125, -5.4853515625, -4.881591796875, -4.27783203125, -3.674072265625, -3.0703125, -2.466552734375, -1.86279296875, -1.259033203125, -0.6552734375, -0.051513671875, 0.55224609375, 1.156005859375, 1.759765625, 2.363525390625, 2.96728515625, 3.571044921875, 4.1748046875, 4.778564453125, 5.38232421875, 5.986083984375, 6.58984375, 7.193603515625, 7.79736328125, 8.401123046875, 9.0048828125, 9.608642578125, 10.21240234375, 10.816162109375, 11.419921875, 12.023681640625, 12.62744140625, 13.231201171875, 13.8349609375, 14.438720703125, 15.04248046875, 15.646240234375, 16.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 19.0, 30.0, 31.0, 70.0, 92.0, 117.0, 142.0, 130.0, 118.0, 87.0, 46.0, 39.0, 22.0, 12.0, 8.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5353240966796875, -0.520355224609375, -0.5053863525390625, -0.49041748046875, -0.4754486083984375, -0.460479736328125, -0.4455108642578125, -0.4305419921875, -0.4155731201171875, -0.400604248046875, -0.3856353759765625, -0.37066650390625, -0.3556976318359375, -0.340728759765625, -0.3257598876953125, -0.310791015625, -0.2958221435546875, -0.280853271484375, -0.2658843994140625, -0.25091552734375, -0.2359466552734375, -0.220977783203125, -0.2060089111328125, -0.1910400390625, -0.1760711669921875, -0.161102294921875, -0.1461334228515625, -0.13116455078125, -0.1161956787109375, -0.101226806640625, -0.0862579345703125, -0.0712890625, -0.0563201904296875, -0.041351318359375, -0.0263824462890625, -0.01141357421875, 0.0035552978515625, 0.018524169921875, 0.0334930419921875, 0.0484619140625, 0.0634307861328125, 0.078399658203125, 0.0933685302734375, 0.10833740234375, 0.1233062744140625, 0.138275146484375, 0.1532440185546875, 0.168212890625, 0.1831817626953125, 0.198150634765625, 0.2131195068359375, 0.22808837890625, 0.2430572509765625, 0.258026123046875, 0.2729949951171875, 0.2879638671875, 0.3029327392578125, 0.317901611328125, 0.3328704833984375, 0.34783935546875, 0.3628082275390625, 0.377777099609375, 0.3927459716796875, 0.40771484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 4.0, 6.0, 12.0, 12.0, 35.0, 46.0, 56.0, 126.0, 232.0, 657.0, 2711.0, 23682.0, 3856970.0, 297438.0, 9935.0, 1478.0, 403.0, 176.0, 112.0, 56.0, 43.0, 31.0, 34.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.42578125, -5.17718505859375, -4.9285888671875, -4.67999267578125, -4.431396484375, -4.18280029296875, -3.9342041015625, -3.68560791015625, -3.43701171875, -3.18841552734375, -2.9398193359375, -2.69122314453125, -2.442626953125, -2.19403076171875, -1.9454345703125, -1.69683837890625, -1.4482421875, -1.19964599609375, -0.9510498046875, -0.70245361328125, -0.453857421875, -0.20526123046875, 0.0433349609375, 0.29193115234375, 0.54052734375, 0.78912353515625, 1.0377197265625, 1.28631591796875, 1.534912109375, 1.78350830078125, 2.0321044921875, 2.28070068359375, 2.529296875, 2.77789306640625, 3.0264892578125, 3.27508544921875, 3.523681640625, 3.77227783203125, 4.0208740234375, 4.26947021484375, 4.51806640625, 4.76666259765625, 5.0152587890625, 5.26385498046875, 5.512451171875, 5.76104736328125, 6.0096435546875, 6.25823974609375, 6.5068359375, 6.75543212890625, 7.0040283203125, 7.25262451171875, 7.501220703125, 7.74981689453125, 7.9984130859375, 8.24700927734375, 8.49560546875, 8.74420166015625, 8.9927978515625, 9.24139404296875, 9.489990234375, 9.73858642578125, 9.9871826171875, 10.23577880859375, 10.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 9.0, 9.0, 9.0, 19.0, 28.0, 36.0, 62.0, 68.0, 147.0, 348.0, 1751.0, 915.0, 263.0, 132.0, 76.0, 42.0, 41.0, 25.0, 21.0, 17.0, 10.0, 5.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6959381103515625, -0.674102783203125, -0.6522674560546875, -0.63043212890625, -0.6085968017578125, -0.586761474609375, -0.5649261474609375, -0.5430908203125, -0.5212554931640625, -0.499420166015625, -0.4775848388671875, -0.45574951171875, -0.4339141845703125, -0.412078857421875, -0.3902435302734375, -0.368408203125, -0.3465728759765625, -0.324737548828125, -0.3029022216796875, -0.28106689453125, -0.2592315673828125, -0.237396240234375, -0.2155609130859375, -0.1937255859375, -0.1718902587890625, -0.150054931640625, -0.1282196044921875, -0.10638427734375, -0.0845489501953125, -0.062713623046875, -0.0408782958984375, -0.01904296875, 0.0027923583984375, 0.024627685546875, 0.0464630126953125, 0.06829833984375, 0.0901336669921875, 0.111968994140625, 0.1338043212890625, 0.1556396484375, 0.1774749755859375, 0.199310302734375, 0.2211456298828125, 0.24298095703125, 0.2648162841796875, 0.286651611328125, 0.3084869384765625, 0.330322265625, 0.3521575927734375, 0.373992919921875, 0.3958282470703125, 0.41766357421875, 0.4394989013671875, 0.461334228515625, 0.4831695556640625, 0.5050048828125, 0.5268402099609375, 0.548675537109375, 0.5705108642578125, 0.59234619140625, 0.6141815185546875, 0.636016845703125, 0.6578521728515625, 0.6796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 16.0, 98.0, 535.0, 302.0, 44.0, 12.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.450634002685547, -20.897205352783203, -20.34377670288086, -19.790348052978516, -19.236919403076172, -18.683490753173828, -18.130062103271484, -17.57663345336914, -17.023204803466797, -16.469776153564453, -15.91634750366211, -15.362918853759766, -14.809490203857422, -14.256061553955078, -13.702632904052734, -13.14920425415039, -12.59577465057373, -12.042346000671387, -11.488917350769043, -10.9354887008667, -10.382060050964355, -9.828631401062012, -9.275201797485352, -8.721773147583008, -8.168344497680664, -7.61491584777832, -7.061487197875977, -6.508058547973633, -5.954629898071289, -5.401201248168945, -4.847772121429443, -4.2943434715271, -3.740915298461914, -3.1874866485595703, -2.6340579986572266, -2.0806291103363037, -1.52720046043396, -0.9737718105316162, -0.42034292221069336, 0.1330857276916504, 0.6865143775939941, 1.239943027496338, 1.7933717966079712, 2.3468005657196045, 2.9002292156219482, 3.453657865524292, 4.007086753845215, 4.560515403747559, 5.113944053649902, 5.667372703552246, 6.22080135345459, 6.774230003356934, 7.327658653259277, 7.881087303161621, 8.434516906738281, 8.987945556640625, 9.541374206542969, 10.094802856445312, 10.648231506347656, 11.20166015625, 11.755088806152344, 12.308517456054688, 12.861946105957031, 13.415374755859375, 13.968803405761719]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 11.0, 14.0, 18.0, 20.0, 28.0, 34.0, 47.0, 55.0, 54.0, 61.0, 71.0, 62.0, 60.0, 71.0, 66.0, 54.0, 50.0, 55.0, 39.0, 24.0, 26.0, 24.0, 20.0, 11.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.167453289031982, -4.066217422485352, -3.9649815559387207, -3.86374568939209, -3.76250958442688, -3.661273717880249, -3.560037851333618, -3.4588019847869873, -3.3575661182403564, -3.2563302516937256, -3.1550943851470947, -3.0538582801818848, -2.952622413635254, -2.851386547088623, -2.750150680541992, -2.6489148139953613, -2.5476789474487305, -2.4464430809020996, -2.3452072143554688, -2.243971347808838, -2.142735242843628, -2.041499376296997, -1.9402635097503662, -1.8390276432037354, -1.7377915382385254, -1.6365556716918945, -1.5353196859359741, -1.4340838193893433, -1.3328479528427124, -1.231611967086792, -1.1303761005401611, -1.0291402339935303, -0.9279043674468994, -0.8266684412956238, -0.7254325747489929, -0.6241966485977173, -0.5229607820510864, -0.4217248558998108, -0.32048892974853516, -0.2192530632019043, -0.11801713705062866, -0.016781233251094818, 0.08445467054843903, 0.18569058179855347, 0.2869264781475067, 0.38816237449645996, 0.4893983006477356, 0.5906341671943665, 0.6918700933456421, 0.7931060194969177, 0.8943418860435486, 0.9955778121948242, 1.096813678741455, 1.198049545288086, 1.2992855310440063, 1.4005213975906372, 1.5017573833465576, 1.6029932498931885, 1.7042292356491089, 1.8054651021957397, 1.9067009687423706, 2.007936954498291, 2.109172821044922, 2.2104086875915527, 2.3116445541381836]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 10.0, 8.0, 8.0, 7.0, 12.0, 22.0, 37.0, 34.0, 45.0, 55.0, 73.0, 101.0, 153.0, 206.0, 309.0, 478.0, 747.0, 1253.0, 2759.0, 7521.0, 32104.0, 267888.0, 631366.0, 80394.0, 13965.0, 4194.0, 1904.0, 942.0, 606.0, 363.0, 259.0, 192.0, 135.0, 97.0, 81.0, 49.0, 34.0, 29.0, 31.0, 22.0, 16.0, 5.0, 12.0, 6.0, 1.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.769134521484375, -2.67108154296875, -2.573028564453125, -2.4749755859375, -2.376922607421875, -2.27886962890625, -2.180816650390625, -2.082763671875, -1.984710693359375, -1.88665771484375, -1.788604736328125, -1.6905517578125, -1.592498779296875, -1.49444580078125, -1.396392822265625, -1.29833984375, -1.200286865234375, -1.10223388671875, -1.004180908203125, -0.9061279296875, -0.808074951171875, -0.71002197265625, -0.611968994140625, -0.513916015625, -0.415863037109375, -0.31781005859375, -0.219757080078125, -0.1217041015625, -0.023651123046875, 0.07440185546875, 0.172454833984375, 0.2705078125, 0.368560791015625, 0.46661376953125, 0.564666748046875, 0.6627197265625, 0.760772705078125, 0.85882568359375, 0.956878662109375, 1.054931640625, 1.152984619140625, 1.25103759765625, 1.349090576171875, 1.4471435546875, 1.545196533203125, 1.64324951171875, 1.741302490234375, 1.83935546875, 1.937408447265625, 2.03546142578125, 2.133514404296875, 2.2315673828125, 2.329620361328125, 2.42767333984375, 2.525726318359375, 2.623779296875, 2.721832275390625, 2.81988525390625, 2.917938232421875, 3.0159912109375, 3.114044189453125, 3.21209716796875, 3.310150146484375, 3.408203125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 15.0, 28.0, 72.0, 87.0, 117.0, 158.0, 172.0, 130.0, 95.0, 49.0, 37.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5757675170898438, -0.5577850341796875, -0.5398025512695312, -0.521820068359375, -0.5038375854492188, -0.4858551025390625, -0.46787261962890625, -0.44989013671875, -0.43190765380859375, -0.4139251708984375, -0.39594268798828125, -0.377960205078125, -0.35997772216796875, -0.3419952392578125, -0.32401275634765625, -0.3060302734375, -0.28804779052734375, -0.2700653076171875, -0.25208282470703125, -0.234100341796875, -0.21611785888671875, -0.1981353759765625, -0.18015289306640625, -0.16217041015625, -0.14418792724609375, -0.1262054443359375, -0.10822296142578125, -0.090240478515625, -0.07225799560546875, -0.0542755126953125, -0.03629302978515625, -0.018310546875, -0.00032806396484375, 0.0176544189453125, 0.03563690185546875, 0.053619384765625, 0.07160186767578125, 0.0895843505859375, 0.10756683349609375, 0.12554931640625, 0.14353179931640625, 0.1615142822265625, 0.17949676513671875, 0.197479248046875, 0.21546173095703125, 0.2334442138671875, 0.25142669677734375, 0.2694091796875, 0.28739166259765625, 0.3053741455078125, 0.32335662841796875, 0.341339111328125, 0.35932159423828125, 0.3773040771484375, 0.39528656005859375, 0.41326904296875, 0.43125152587890625, 0.4492340087890625, 0.46721649169921875, 0.485198974609375, 0.5031814575195312, 0.5211639404296875, 0.5391464233398438, 0.55712890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 10.0, 9.0, 10.0, 16.0, 27.0, 33.0, 44.0, 66.0, 108.0, 157.0, 265.0, 475.0, 851.0, 1645.0, 3416.0, 8335.0, 27350.0, 140322.0, 625875.0, 187232.0, 34374.0, 9788.0, 3887.0, 1889.0, 943.0, 552.0, 301.0, 215.0, 107.0, 72.0, 47.0, 30.0, 13.0, 14.0, 14.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -1.991455078125, -1.91650390625, -1.841552734375, -1.7666015625, -1.691650390625, -1.61669921875, -1.541748046875, -1.466796875, -1.391845703125, -1.31689453125, -1.241943359375, -1.1669921875, -1.092041015625, -1.01708984375, -0.942138671875, -0.8671875, -0.792236328125, -0.71728515625, -0.642333984375, -0.5673828125, -0.492431640625, -0.41748046875, -0.342529296875, -0.267578125, -0.192626953125, -0.11767578125, -0.042724609375, 0.0322265625, 0.107177734375, 0.18212890625, 0.257080078125, 0.33203125, 0.406982421875, 0.48193359375, 0.556884765625, 0.6318359375, 0.706787109375, 0.78173828125, 0.856689453125, 0.931640625, 1.006591796875, 1.08154296875, 1.156494140625, 1.2314453125, 1.306396484375, 1.38134765625, 1.456298828125, 1.53125, 1.606201171875, 1.68115234375, 1.756103515625, 1.8310546875, 1.906005859375, 1.98095703125, 2.055908203125, 2.130859375, 2.205810546875, 2.28076171875, 2.355712890625, 2.4306640625, 2.505615234375, 2.58056640625, 2.655517578125, 2.73046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 8.0, 23.0, 22.0, 29.0, 37.0, 62.0, 58.0, 77.0, 63.0, 93.0, 76.0, 89.0, 77.0, 57.0, 51.0, 41.0, 22.0, 25.0, 19.0, 21.0, 8.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7398681640625, -1.677001953125, -1.6141357421875, -1.55126953125, -1.4884033203125, -1.425537109375, -1.3626708984375, -1.2998046875, -1.2369384765625, -1.174072265625, -1.1112060546875, -1.04833984375, -0.9854736328125, -0.922607421875, -0.8597412109375, -0.796875, -0.7340087890625, -0.671142578125, -0.6082763671875, -0.54541015625, -0.4825439453125, -0.419677734375, -0.3568115234375, -0.2939453125, -0.2310791015625, -0.168212890625, -0.1053466796875, -0.04248046875, 0.0203857421875, 0.083251953125, 0.1461181640625, 0.208984375, 0.2718505859375, 0.334716796875, 0.3975830078125, 0.46044921875, 0.5233154296875, 0.586181640625, 0.6490478515625, 0.7119140625, 0.7747802734375, 0.837646484375, 0.9005126953125, 0.96337890625, 1.0262451171875, 1.089111328125, 1.1519775390625, 1.21484375, 1.2777099609375, 1.340576171875, 1.4034423828125, 1.46630859375, 1.5291748046875, 1.592041015625, 1.6549072265625, 1.7177734375, 1.7806396484375, 1.843505859375, 1.9063720703125, 1.96923828125, 2.0321044921875, 2.094970703125, 2.1578369140625, 2.220703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 11.0, 8.0, 21.0, 39.0, 53.0, 104.0, 224.0, 580.0, 2558.0, 44667.0, 986779.0, 11330.0, 1345.0, 429.0, 201.0, 95.0, 37.0, 33.0, 9.0, 13.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3590087890625, -6.178955078125, -5.9989013671875, -5.81884765625, -5.6387939453125, -5.458740234375, -5.2786865234375, -5.0986328125, -4.9185791015625, -4.738525390625, -4.5584716796875, -4.37841796875, -4.1983642578125, -4.018310546875, -3.8382568359375, -3.658203125, -3.4781494140625, -3.298095703125, -3.1180419921875, -2.93798828125, -2.7579345703125, -2.577880859375, -2.3978271484375, -2.2177734375, -2.0377197265625, -1.857666015625, -1.6776123046875, -1.49755859375, -1.3175048828125, -1.137451171875, -0.9573974609375, -0.77734375, -0.5972900390625, -0.417236328125, -0.2371826171875, -0.05712890625, 0.1229248046875, 0.302978515625, 0.4830322265625, 0.6630859375, 0.8431396484375, 1.023193359375, 1.2032470703125, 1.38330078125, 1.5633544921875, 1.743408203125, 1.9234619140625, 2.103515625, 2.2835693359375, 2.463623046875, 2.6436767578125, 2.82373046875, 3.0037841796875, 3.183837890625, 3.3638916015625, 3.5439453125, 3.7239990234375, 3.904052734375, 4.0841064453125, 4.26416015625, 4.4442138671875, 4.624267578125, 4.8043212890625, 4.984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 11.0, 9.0, 14.0, 26.0, 41.0, 40.0, 87.0, 125.0, 192.0, 167.0, 104.0, 73.0, 45.0, 10.0, 10.0, 13.0, 10.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024008750915527344, -0.0002327561378479004, -0.00022542476654052734, -0.0002180933952331543, -0.00021076202392578125, -0.0002034306526184082, -0.00019609928131103516, -0.0001887679100036621, -0.00018143653869628906, -0.00017410516738891602, -0.00016677379608154297, -0.00015944242477416992, -0.00015211105346679688, -0.00014477968215942383, -0.00013744831085205078, -0.00013011693954467773, -0.0001227855682373047, -0.00011545419692993164, -0.0001081228256225586, -0.00010079145431518555, -9.34600830078125e-05, -8.612871170043945e-05, -7.87973403930664e-05, -7.146596908569336e-05, -6.413459777832031e-05, -5.6803226470947266e-05, -4.947185516357422e-05, -4.214048385620117e-05, -3.4809112548828125e-05, -2.7477741241455078e-05, -2.014636993408203e-05, -1.2814998626708984e-05, -5.4836273193359375e-06, 1.8477439880371094e-06, 9.179115295410156e-06, 1.6510486602783203e-05, 2.384185791015625e-05, 3.11732292175293e-05, 3.8504600524902344e-05, 4.583597183227539e-05, 5.316734313964844e-05, 6.0498714447021484e-05, 6.783008575439453e-05, 7.516145706176758e-05, 8.249282836914062e-05, 8.982419967651367e-05, 9.715557098388672e-05, 0.00010448694229125977, 0.00011181831359863281, 0.00011914968490600586, 0.0001264810562133789, 0.00013381242752075195, 0.000141143798828125, 0.00014847517013549805, 0.0001558065414428711, 0.00016313791275024414, 0.0001704692840576172, 0.00017780065536499023, 0.00018513202667236328, 0.00019246339797973633, 0.00019979476928710938, 0.00020712614059448242, 0.00021445751190185547, 0.00022178888320922852, 0.00022912025451660156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 12.0, 8.0, 6.0, 10.0, 22.0, 17.0, 39.0, 68.0, 126.0, 156.0, 322.0, 515.0, 1123.0, 2485.0, 6937.0, 27671.0, 400651.0, 559262.0, 35523.0, 8122.0, 2882.0, 1236.0, 565.0, 292.0, 173.0, 113.0, 63.0, 41.0, 34.0, 19.0, 10.0, 16.0, 7.0, 4.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8662109375, -1.811431884765625, -1.75665283203125, -1.701873779296875, -1.6470947265625, -1.592315673828125, -1.53753662109375, -1.482757568359375, -1.427978515625, -1.373199462890625, -1.31842041015625, -1.263641357421875, -1.2088623046875, -1.154083251953125, -1.09930419921875, -1.044525146484375, -0.98974609375, -0.934967041015625, -0.88018798828125, -0.825408935546875, -0.7706298828125, -0.715850830078125, -0.66107177734375, -0.606292724609375, -0.551513671875, -0.496734619140625, -0.44195556640625, -0.387176513671875, -0.3323974609375, -0.277618408203125, -0.22283935546875, -0.168060302734375, -0.11328125, -0.058502197265625, -0.00372314453125, 0.051055908203125, 0.1058349609375, 0.160614013671875, 0.21539306640625, 0.270172119140625, 0.324951171875, 0.379730224609375, 0.43450927734375, 0.489288330078125, 0.5440673828125, 0.598846435546875, 0.65362548828125, 0.708404541015625, 0.76318359375, 0.817962646484375, 0.87274169921875, 0.927520751953125, 0.9822998046875, 1.037078857421875, 1.09185791015625, 1.146636962890625, 1.201416015625, 1.256195068359375, 1.31097412109375, 1.365753173828125, 1.4205322265625, 1.475311279296875, 1.53009033203125, 1.584869384765625, 1.6396484375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 13.0, 17.0, 26.0, 68.0, 141.0, 223.0, 221.0, 126.0, 69.0, 41.0, 17.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3406219482421875, -1.297454833984375, -1.2542877197265625, -1.21112060546875, -1.1679534912109375, -1.124786376953125, -1.0816192626953125, -1.0384521484375, -0.9952850341796875, -0.952117919921875, -0.9089508056640625, -0.86578369140625, -0.8226165771484375, -0.779449462890625, -0.7362823486328125, -0.693115234375, -0.6499481201171875, -0.606781005859375, -0.5636138916015625, -0.52044677734375, -0.4772796630859375, -0.434112548828125, -0.3909454345703125, -0.3477783203125, -0.3046112060546875, -0.261444091796875, -0.2182769775390625, -0.17510986328125, -0.1319427490234375, -0.088775634765625, -0.0456085205078125, -0.00244140625, 0.0407257080078125, 0.083892822265625, 0.1270599365234375, 0.17022705078125, 0.2133941650390625, 0.256561279296875, 0.2997283935546875, 0.3428955078125, 0.3860626220703125, 0.429229736328125, 0.4723968505859375, 0.51556396484375, 0.5587310791015625, 0.601898193359375, 0.6450653076171875, 0.688232421875, 0.7313995361328125, 0.774566650390625, 0.8177337646484375, 0.86090087890625, 0.9040679931640625, 0.947235107421875, 0.9904022216796875, 1.0335693359375, 1.0767364501953125, 1.119903564453125, 1.1630706787109375, 1.20623779296875, 1.2494049072265625, 1.292572021484375, 1.3357391357421875, 1.37890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 17.0, 24.0, 37.0, 55.0, 140.0, 203.0, 212.0, 143.0, 73.0, 31.0, 23.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.99288558959961, -16.475082397460938, -15.95727825164795, -15.439474105834961, -14.921669960021973, -14.403865814208984, -13.886062622070312, -13.368258476257324, -12.850454330444336, -12.332650184631348, -11.814846992492676, -11.297042846679688, -10.7792387008667, -10.261434555053711, -9.743631362915039, -9.22582721710205, -8.708024024963379, -8.19021987915039, -7.6724162101745605, -7.1546125411987305, -6.636808395385742, -6.119004726409912, -5.601201057434082, -5.083396911621094, -4.565593242645264, -4.047789573669434, -3.5299854278564453, -3.0121817588806152, -2.494377851486206, -1.9765739440917969, -1.4587702751159668, -0.9409663677215576, -0.42316246032714844, 0.09464138746261597, 0.6124452352523804, 1.1302490234375, 1.6480529308319092, 2.1658568382263184, 2.6836605072021484, 3.2014644145965576, 3.719268321990967, 4.237071990966797, 4.754876136779785, 5.272679805755615, 5.790483474731445, 6.308287620544434, 6.826091289520264, 7.343894958496094, 7.861699104309082, 8.37950325012207, 8.897306442260742, 9.41511058807373, 9.932914733886719, 10.45071792602539, 10.968522071838379, 11.486326217651367, 12.004129409790039, 12.521933555603027, 13.0397367477417, 13.557540893554688, 14.075345039367676, 14.593149185180664, 15.110952377319336, 15.628756523132324, 16.146560668945312]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 9.0, 16.0, 23.0, 19.0, 32.0, 39.0, 42.0, 60.0, 52.0, 55.0, 76.0, 71.0, 86.0, 53.0, 51.0, 60.0, 37.0, 33.0, 37.0, 26.0, 25.0, 18.0, 12.0, 14.0, 11.0, 10.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.542821884155273, -14.108731269836426, -13.674640655517578, -13.24055004119873, -12.806459426879883, -12.372369766235352, -11.938279151916504, -11.504188537597656, -11.070097923278809, -10.636007308959961, -10.201916694641113, -9.767826080322266, -9.333736419677734, -8.89964485168457, -8.465555191040039, -8.031464576721191, -7.597373962402344, -7.163283348083496, -6.729192733764648, -6.295102596282959, -5.861011981964111, -5.426921367645264, -4.992831230163574, -4.558740615844727, -4.124650001525879, -3.6905593872070312, -3.2564690113067627, -2.822378635406494, -2.3882880210876465, -1.9541974067687988, -1.5201070308685303, -1.0860166549682617, -0.6519260406494141, -0.21783554553985596, 0.21625494956970215, 0.6503454446792603, 1.0844359397888184, 1.518526554107666, 1.9526169300079346, 2.386707305908203, 2.820797920227051, 3.2548885345458984, 3.688978910446167, 4.1230692863464355, 4.557159900665283, 4.991250514984131, 5.42534065246582, 5.859431266784668, 6.293521881103516, 6.727612495422363, 7.161703109741211, 7.5957932472229, 8.029884338378906, 8.463973999023438, 8.898064613342285, 9.332155227661133, 9.76624584197998, 10.200336456298828, 10.634427070617676, 11.068517684936523, 11.502607345581055, 11.936698913574219, 12.37078857421875, 12.804879188537598, 13.238969802856445]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 5.0, 12.0, 5.0, 11.0, 7.0, 11.0, 18.0, 24.0, 24.0, 32.0, 42.0, 51.0, 71.0, 78.0, 104.0, 144.0, 195.0, 262.0, 361.0, 552.0, 838.0, 1502.0, 2551.0, 5224.0, 11179.0, 28399.0, 107046.0, 3193786.0, 723786.0, 75447.0, 22802.0, 9428.0, 4444.0, 2390.0, 1266.0, 739.0, 495.0, 299.0, 219.0, 135.0, 101.0, 56.0, 38.0, 35.0, 33.0, 8.0, 11.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.189453125, -3.107421875, -3.025390625, -2.943359375, -2.861328125, -2.779296875, -2.697265625, -2.615234375, -2.533203125, -2.451171875, -2.369140625, -2.287109375, -2.205078125, -2.123046875, -2.041015625, -1.958984375, -1.876953125, -1.794921875, -1.712890625, -1.630859375, -1.548828125, -1.466796875, -1.384765625, -1.302734375, -1.220703125, -1.138671875, -1.056640625, -0.974609375, -0.892578125, -0.810546875, -0.728515625, -0.646484375, -0.564453125, -0.482421875, -0.400390625, -0.318359375, -0.236328125, -0.154296875, -0.072265625, 0.009765625, 0.091796875, 0.173828125, 0.255859375, 0.337890625, 0.419921875, 0.501953125, 0.583984375, 0.666015625, 0.748046875, 0.830078125, 0.912109375, 0.994140625, 1.076171875, 1.158203125, 1.240234375, 1.322265625, 1.404296875, 1.486328125, 1.568359375, 1.650390625, 1.732421875, 1.814453125, 1.896484375, 1.978515625, 2.060546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 22.0, 33.0, 49.0, 60.0, 84.0, 69.0, 77.0, 100.0, 93.0, 61.0, 61.0, 66.0, 43.0, 42.0, 39.0, 15.0, 10.0, 10.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.529296875, -0.5162696838378906, -0.5032424926757812, -0.4902153015136719, -0.4771881103515625, -0.4641609191894531, -0.45113372802734375, -0.4381065368652344, -0.425079345703125, -0.4120521545410156, -0.39902496337890625, -0.3859977722167969, -0.3729705810546875, -0.3599433898925781, -0.34691619873046875, -0.3338890075683594, -0.32086181640625, -0.3078346252441406, -0.29480743408203125, -0.2817802429199219, -0.2687530517578125, -0.2557258605957031, -0.24269866943359375, -0.22967147827148438, -0.216644287109375, -0.20361709594726562, -0.19058990478515625, -0.17756271362304688, -0.1645355224609375, -0.15150833129882812, -0.13848114013671875, -0.12545394897460938, -0.1124267578125, -0.09939956665039062, -0.08637237548828125, -0.07334518432617188, -0.0603179931640625, -0.047290802001953125, -0.03426361083984375, -0.021236419677734375, -0.008209228515625, 0.004817962646484375, 0.01784515380859375, 0.030872344970703125, 0.0438995361328125, 0.056926727294921875, 0.06995391845703125, 0.08298110961914062, 0.09600830078125, 0.10903549194335938, 0.12206268310546875, 0.13508987426757812, 0.1481170654296875, 0.16114425659179688, 0.17417144775390625, 0.18719863891601562, 0.200225830078125, 0.21325302124023438, 0.22628021240234375, 0.23930740356445312, 0.2523345947265625, 0.2653617858886719, 0.27838897705078125, 0.2914161682128906, 0.304443359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 10.0, 12.0, 14.0, 24.0, 46.0, 82.0, 128.0, 248.0, 518.0, 1246.0, 3289.0, 13288.0, 154921.0, 3921132.0, 83921.0, 10237.0, 2893.0, 1161.0, 490.0, 263.0, 131.0, 78.0, 58.0, 30.0, 15.0, 7.0, 2.0, 6.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.5, -4.36529541015625, -4.2305908203125, -4.09588623046875, -3.961181640625, -3.82647705078125, -3.6917724609375, -3.55706787109375, -3.42236328125, -3.28765869140625, -3.1529541015625, -3.01824951171875, -2.883544921875, -2.74884033203125, -2.6141357421875, -2.47943115234375, -2.3447265625, -2.21002197265625, -2.0753173828125, -1.94061279296875, -1.805908203125, -1.67120361328125, -1.5364990234375, -1.40179443359375, -1.26708984375, -1.13238525390625, -0.9976806640625, -0.86297607421875, -0.728271484375, -0.59356689453125, -0.4588623046875, -0.32415771484375, -0.189453125, -0.05474853515625, 0.0799560546875, 0.21466064453125, 0.349365234375, 0.48406982421875, 0.6187744140625, 0.75347900390625, 0.88818359375, 1.02288818359375, 1.1575927734375, 1.29229736328125, 1.427001953125, 1.56170654296875, 1.6964111328125, 1.83111572265625, 1.9658203125, 2.10052490234375, 2.2352294921875, 2.36993408203125, 2.504638671875, 2.63934326171875, 2.7740478515625, 2.90875244140625, 3.04345703125, 3.17816162109375, 3.3128662109375, 3.44757080078125, 3.582275390625, 3.71697998046875, 3.8516845703125, 3.98638916015625, 4.12109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 12.0, 16.0, 21.0, 39.0, 58.0, 100.0, 176.0, 469.0, 2117.0, 570.0, 194.0, 85.0, 67.0, 36.0, 39.0, 15.0, 7.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61572265625, -0.5925521850585938, -0.5693817138671875, -0.5462112426757812, -0.523040771484375, -0.49987030029296875, -0.4766998291015625, -0.45352935791015625, -0.43035888671875, -0.40718841552734375, -0.3840179443359375, -0.36084747314453125, -0.337677001953125, -0.31450653076171875, -0.2913360595703125, -0.26816558837890625, -0.2449951171875, -0.22182464599609375, -0.1986541748046875, -0.17548370361328125, -0.152313232421875, -0.12914276123046875, -0.1059722900390625, -0.08280181884765625, -0.05963134765625, -0.03646087646484375, -0.0132904052734375, 0.00988006591796875, 0.033050537109375, 0.05622100830078125, 0.0793914794921875, 0.10256195068359375, 0.125732421875, 0.14890289306640625, 0.1720733642578125, 0.19524383544921875, 0.218414306640625, 0.24158477783203125, 0.2647552490234375, 0.28792572021484375, 0.31109619140625, 0.33426666259765625, 0.3574371337890625, 0.38060760498046875, 0.403778076171875, 0.42694854736328125, 0.4501190185546875, 0.47328948974609375, 0.4964599609375, 0.5196304321289062, 0.5428009033203125, 0.5659713745117188, 0.589141845703125, 0.6123123168945312, 0.6354827880859375, 0.6586532592773438, 0.68182373046875, 0.7049942016601562, 0.7281646728515625, 0.7513351440429688, 0.774505615234375, 0.7976760864257812, 0.8208465576171875, 0.8440170288085938, 0.8671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 20.0, 33.0, 128.0, 256.0, 339.0, 139.0, 56.0, 17.0, 13.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.124211311340332, -9.889419555664062, -9.65462875366211, -9.41983699798584, -9.18504524230957, -8.950254440307617, -8.715462684631348, -8.480670928955078, -8.245880126953125, -8.011088371276855, -7.776297092437744, -7.541505813598633, -7.3067145347595215, -7.07192325592041, -6.837131500244141, -6.602340221405029, -6.36754846572876, -6.132757186889648, -5.897965431213379, -5.663174152374268, -5.428382873535156, -5.193591117858887, -4.958799839019775, -4.724008560180664, -4.4892168045043945, -4.254425525665283, -4.019633769989014, -3.7848424911499023, -3.550051212310791, -3.3152596950531006, -3.08046817779541, -2.845676898956299, -2.6108856201171875, -2.376094102859497, -2.1413028240203857, -1.9065113067626953, -1.6717199087142944, -1.4369285106658936, -1.2021369934082031, -0.9673455953598022, -0.7325541973114014, -0.4977627694606781, -0.26297134160995483, -0.02817988395690918, 0.2066115140914917, 0.4414029121398926, 0.676194429397583, 0.9109858274459839, 1.1457772254943848, 1.3805686235427856, 1.6153600215911865, 1.850151538848877, 2.0849428176879883, 2.3197343349456787, 2.554525852203369, 2.7893171310424805, 3.024108648300171, 3.2589001655578613, 3.4936914443969727, 3.728482961654663, 3.9632744789123535, 4.198065757751465, 4.432857513427734, 4.667648792266846, 4.902440071105957]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 9.0, 16.0, 20.0, 18.0, 31.0, 45.0, 52.0, 54.0, 44.0, 60.0, 70.0, 65.0, 60.0, 63.0, 54.0, 56.0, 58.0, 43.0, 35.0, 27.0, 24.0, 20.0, 20.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1959757804870605, -2.1162328720092773, -2.036489963531494, -1.9567471742630005, -1.8770042657852173, -1.797261357307434, -1.7175185680389404, -1.6377756595611572, -1.558032751083374, -1.4782898426055908, -1.3985469341278076, -1.318804144859314, -1.2390612363815308, -1.1593183279037476, -1.079575538635254, -0.9998326301574707, -0.9200897216796875, -0.8403468132019043, -0.7606039643287659, -0.6808611154556274, -0.6011182069778442, -0.521375298500061, -0.4416324496269226, -0.3618896007537842, -0.282146692276001, -0.20240381360054016, -0.12266093492507935, -0.04291805624961853, 0.036824822425842285, 0.1165677011013031, 0.19631057977676392, 0.27605342864990234, 0.35579633712768555, 0.43553921580314636, 0.5152820944786072, 0.5950249433517456, 0.6747678518295288, 0.754510760307312, 0.8342536091804504, 0.9139964580535889, 0.9937393665313721, 1.0734822750091553, 1.1532251834869385, 1.2329679727554321, 1.3127108812332153, 1.3924537897109985, 1.4721965789794922, 1.5519394874572754, 1.6316823959350586, 1.7114253044128418, 1.791168212890625, 1.8709110021591187, 1.9506539106369019, 2.0303966999053955, 2.1101396083831787, 2.189882516860962, 2.269625425338745, 2.3493683338165283, 2.4291112422943115, 2.5088541507720947, 2.588596820831299, 2.668339729309082, 2.7480826377868652, 2.8278255462646484, 2.9075684547424316]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 10.0, 10.0, 17.0, 20.0, 27.0, 38.0, 55.0, 87.0, 115.0, 214.0, 306.0, 467.0, 879.0, 1536.0, 2904.0, 6466.0, 17007.0, 56175.0, 246303.0, 509209.0, 147731.0, 36676.0, 12047.0, 4826.0, 2328.0, 1165.0, 729.0, 424.0, 259.0, 157.0, 114.0, 64.0, 52.0, 41.0, 31.0, 23.0, 9.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-2.5, -2.434783935546875, -2.36956787109375, -2.304351806640625, -2.2391357421875, -2.173919677734375, -2.10870361328125, -2.043487548828125, -1.978271484375, -1.913055419921875, -1.84783935546875, -1.782623291015625, -1.7174072265625, -1.652191162109375, -1.58697509765625, -1.521759033203125, -1.45654296875, -1.391326904296875, -1.32611083984375, -1.260894775390625, -1.1956787109375, -1.130462646484375, -1.06524658203125, -1.000030517578125, -0.934814453125, -0.869598388671875, -0.80438232421875, -0.739166259765625, -0.6739501953125, -0.608734130859375, -0.54351806640625, -0.478302001953125, -0.4130859375, -0.347869873046875, -0.28265380859375, -0.217437744140625, -0.1522216796875, -0.087005615234375, -0.02178955078125, 0.043426513671875, 0.108642578125, 0.173858642578125, 0.23907470703125, 0.304290771484375, 0.3695068359375, 0.434722900390625, 0.49993896484375, 0.565155029296875, 0.63037109375, 0.695587158203125, 0.76080322265625, 0.826019287109375, 0.8912353515625, 0.956451416015625, 1.02166748046875, 1.086883544921875, 1.152099609375, 1.217315673828125, 1.28253173828125, 1.347747802734375, 1.4129638671875, 1.478179931640625, 1.54339599609375, 1.608612060546875, 1.673828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 14.0, 16.0, 20.0, 36.0, 61.0, 74.0, 88.0, 96.0, 94.0, 107.0, 77.0, 77.0, 65.0, 41.0, 37.0, 21.0, 23.0, 13.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5732498168945312, -0.5581207275390625, -0.5429916381835938, -0.527862548828125, -0.5127334594726562, -0.4976043701171875, -0.48247528076171875, -0.46734619140625, -0.45221710205078125, -0.4370880126953125, -0.42195892333984375, -0.406829833984375, -0.39170074462890625, -0.3765716552734375, -0.36144256591796875, -0.3463134765625, -0.33118438720703125, -0.3160552978515625, -0.30092620849609375, -0.285797119140625, -0.27066802978515625, -0.2555389404296875, -0.24040985107421875, -0.22528076171875, -0.21015167236328125, -0.1950225830078125, -0.17989349365234375, -0.164764404296875, -0.14963531494140625, -0.1345062255859375, -0.11937713623046875, -0.104248046875, -0.08911895751953125, -0.0739898681640625, -0.05886077880859375, -0.043731689453125, -0.02860260009765625, -0.0134735107421875, 0.00165557861328125, 0.01678466796875, 0.03191375732421875, 0.0470428466796875, 0.06217193603515625, 0.077301025390625, 0.09243011474609375, 0.1075592041015625, 0.12268829345703125, 0.1378173828125, 0.15294647216796875, 0.1680755615234375, 0.18320465087890625, 0.198333740234375, 0.21346282958984375, 0.2285919189453125, 0.24372100830078125, 0.25885009765625, 0.27397918701171875, 0.2891082763671875, 0.30423736572265625, 0.319366455078125, 0.33449554443359375, 0.3496246337890625, 0.36475372314453125, 0.3798828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 7.0, 4.0, 8.0, 19.0, 12.0, 33.0, 34.0, 40.0, 70.0, 94.0, 118.0, 207.0, 299.0, 620.0, 1082.0, 2035.0, 3976.0, 8658.0, 22841.0, 76346.0, 338952.0, 438871.0, 104457.0, 29264.0, 10598.0, 4633.0, 2320.0, 1199.0, 672.0, 405.0, 238.0, 137.0, 79.0, 67.0, 36.0, 30.0, 25.0, 27.0, 15.0, 6.0, 6.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6240234375, -1.5682373046875, -1.512451171875, -1.4566650390625, -1.40087890625, -1.3450927734375, -1.289306640625, -1.2335205078125, -1.177734375, -1.1219482421875, -1.066162109375, -1.0103759765625, -0.95458984375, -0.8988037109375, -0.843017578125, -0.7872314453125, -0.7314453125, -0.6756591796875, -0.619873046875, -0.5640869140625, -0.50830078125, -0.4525146484375, -0.396728515625, -0.3409423828125, -0.28515625, -0.2293701171875, -0.173583984375, -0.1177978515625, -0.06201171875, -0.0062255859375, 0.049560546875, 0.1053466796875, 0.1611328125, 0.2169189453125, 0.272705078125, 0.3284912109375, 0.38427734375, 0.4400634765625, 0.495849609375, 0.5516357421875, 0.607421875, 0.6632080078125, 0.718994140625, 0.7747802734375, 0.83056640625, 0.8863525390625, 0.942138671875, 0.9979248046875, 1.0537109375, 1.1094970703125, 1.165283203125, 1.2210693359375, 1.27685546875, 1.3326416015625, 1.388427734375, 1.4442138671875, 1.5, 1.5557861328125, 1.611572265625, 1.6673583984375, 1.72314453125, 1.7789306640625, 1.834716796875, 1.8905029296875, 1.9462890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 6.0, 7.0, 14.0, 13.0, 19.0, 27.0, 38.0, 38.0, 47.0, 56.0, 76.0, 74.0, 79.0, 72.0, 73.0, 65.0, 58.0, 45.0, 31.0, 27.0, 27.0, 22.0, 20.0, 7.0, 7.0, 5.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.77734375, -1.716552734375, -1.65576171875, -1.594970703125, -1.5341796875, -1.473388671875, -1.41259765625, -1.351806640625, -1.291015625, -1.230224609375, -1.16943359375, -1.108642578125, -1.0478515625, -0.987060546875, -0.92626953125, -0.865478515625, -0.8046875, -0.743896484375, -0.68310546875, -0.622314453125, -0.5615234375, -0.500732421875, -0.43994140625, -0.379150390625, -0.318359375, -0.257568359375, -0.19677734375, -0.135986328125, -0.0751953125, -0.014404296875, 0.04638671875, 0.107177734375, 0.16796875, 0.228759765625, 0.28955078125, 0.350341796875, 0.4111328125, 0.471923828125, 0.53271484375, 0.593505859375, 0.654296875, 0.715087890625, 0.77587890625, 0.836669921875, 0.8974609375, 0.958251953125, 1.01904296875, 1.079833984375, 1.140625, 1.201416015625, 1.26220703125, 1.322998046875, 1.3837890625, 1.444580078125, 1.50537109375, 1.566162109375, 1.626953125, 1.687744140625, 1.74853515625, 1.809326171875, 1.8701171875, 1.930908203125, 1.99169921875, 2.052490234375, 2.11328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 13.0, 15.0, 21.0, 35.0, 68.0, 80.0, 172.0, 473.0, 1233.0, 4781.0, 30394.0, 711924.0, 279068.0, 15705.0, 2961.0, 887.0, 322.0, 145.0, 82.0, 44.0, 32.0, 18.0, 13.0, 15.0, 12.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2954559326171875, -1.252044677734375, -1.2086334228515625, -1.16522216796875, -1.1218109130859375, -1.078399658203125, -1.0349884033203125, -0.9915771484375, -0.9481658935546875, -0.904754638671875, -0.8613433837890625, -0.81793212890625, -0.7745208740234375, -0.731109619140625, -0.6876983642578125, -0.644287109375, -0.6008758544921875, -0.557464599609375, -0.5140533447265625, -0.47064208984375, -0.4272308349609375, -0.383819580078125, -0.3404083251953125, -0.2969970703125, -0.2535858154296875, -0.210174560546875, -0.1667633056640625, -0.12335205078125, -0.0799407958984375, -0.036529541015625, 0.0068817138671875, 0.05029296875, 0.0937042236328125, 0.137115478515625, 0.1805267333984375, 0.22393798828125, 0.2673492431640625, 0.310760498046875, 0.3541717529296875, 0.3975830078125, 0.4409942626953125, 0.484405517578125, 0.5278167724609375, 0.57122802734375, 0.6146392822265625, 0.658050537109375, 0.7014617919921875, 0.744873046875, 0.7882843017578125, 0.831695556640625, 0.8751068115234375, 0.91851806640625, 0.9619293212890625, 1.005340576171875, 1.0487518310546875, 1.0921630859375, 1.1355743408203125, 1.178985595703125, 1.2223968505859375, 1.26580810546875, 1.3092193603515625, 1.352630615234375, 1.3960418701171875, 1.439453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 16.0, 14.0, 12.0, 21.0, 23.0, 30.0, 44.0, 59.0, 59.0, 88.0, 99.0, 110.0, 63.0, 68.0, 66.0, 50.0, 33.0, 25.0, 23.0, 17.0, 6.0, 2.0, 10.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.77799466252327e-05, -8.484162390232086e-05, -8.190330117940903e-05, -7.896497845649719e-05, -7.602665573358536e-05, -7.308833301067352e-05, -7.015001028776169e-05, -6.721168756484985e-05, -6.427336484193802e-05, -6.133504211902618e-05, -5.839671939611435e-05, -5.5458396673202515e-05, -5.252007395029068e-05, -4.9581751227378845e-05, -4.664342850446701e-05, -4.3705105781555176e-05, -4.076678305864334e-05, -3.7828460335731506e-05, -3.489013761281967e-05, -3.195181488990784e-05, -2.9013492166996002e-05, -2.6075169444084167e-05, -2.3136846721172333e-05, -2.0198523998260498e-05, -1.7260201275348663e-05, -1.4321878552436829e-05, -1.1383555829524994e-05, -8.44523310661316e-06, -5.5069103837013245e-06, -2.5685876607894897e-06, 3.6973506212234497e-07, 3.3080577850341797e-06, 6.246380507946014e-06, 9.184703230857849e-06, 1.2123025953769684e-05, 1.5061348676681519e-05, 1.7999671399593353e-05, 2.0937994122505188e-05, 2.3876316845417023e-05, 2.6814639568328857e-05, 2.9752962291240692e-05, 3.269128501415253e-05, 3.562960773706436e-05, 3.8567930459976196e-05, 4.150625318288803e-05, 4.4444575905799866e-05, 4.73828986287117e-05, 5.0321221351623535e-05, 5.325954407453537e-05, 5.6197866797447205e-05, 5.913618952035904e-05, 6.207451224327087e-05, 6.501283496618271e-05, 6.795115768909454e-05, 7.088948041200638e-05, 7.382780313491821e-05, 7.676612585783005e-05, 7.970444858074188e-05, 8.264277130365372e-05, 8.558109402656555e-05, 8.851941674947739e-05, 9.145773947238922e-05, 9.439606219530106e-05, 9.733438491821289e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 7.0, 10.0, 13.0, 21.0, 35.0, 58.0, 83.0, 83.0, 151.0, 258.0, 388.0, 696.0, 1455.0, 2926.0, 7007.0, 19449.0, 80842.0, 544797.0, 321897.0, 44996.0, 13219.0, 5166.0, 2303.0, 1093.0, 563.0, 345.0, 224.0, 139.0, 99.0, 58.0, 46.0, 34.0, 28.0, 24.0, 7.0, 5.0, 8.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.8017578125, -0.7805633544921875, -0.759368896484375, -0.7381744384765625, -0.71697998046875, -0.6957855224609375, -0.674591064453125, -0.6533966064453125, -0.6322021484375, -0.6110076904296875, -0.589813232421875, -0.5686187744140625, -0.54742431640625, -0.5262298583984375, -0.505035400390625, -0.4838409423828125, -0.462646484375, -0.4414520263671875, -0.420257568359375, -0.3990631103515625, -0.37786865234375, -0.3566741943359375, -0.335479736328125, -0.3142852783203125, -0.2930908203125, -0.2718963623046875, -0.250701904296875, -0.2295074462890625, -0.20831298828125, -0.1871185302734375, -0.165924072265625, -0.1447296142578125, -0.12353515625, -0.1023406982421875, -0.081146240234375, -0.0599517822265625, -0.03875732421875, -0.0175628662109375, 0.003631591796875, 0.0248260498046875, 0.0460205078125, 0.0672149658203125, 0.088409423828125, 0.1096038818359375, 0.13079833984375, 0.1519927978515625, 0.173187255859375, 0.1943817138671875, 0.215576171875, 0.2367706298828125, 0.257965087890625, 0.2791595458984375, 0.30035400390625, 0.3215484619140625, 0.342742919921875, 0.3639373779296875, 0.3851318359375, 0.4063262939453125, 0.427520751953125, 0.4487152099609375, 0.46990966796875, 0.4911041259765625, 0.512298583984375, 0.5334930419921875, 0.5546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 16.0, 23.0, 50.0, 74.0, 117.0, 161.0, 145.0, 137.0, 82.0, 63.0, 42.0, 16.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8642578125, -0.841064453125, -0.81787109375, -0.794677734375, -0.771484375, -0.748291015625, -0.72509765625, -0.701904296875, -0.6787109375, -0.655517578125, -0.63232421875, -0.609130859375, -0.5859375, -0.562744140625, -0.53955078125, -0.516357421875, -0.4931640625, -0.469970703125, -0.44677734375, -0.423583984375, -0.400390625, -0.377197265625, -0.35400390625, -0.330810546875, -0.3076171875, -0.284423828125, -0.26123046875, -0.238037109375, -0.21484375, -0.191650390625, -0.16845703125, -0.145263671875, -0.1220703125, -0.098876953125, -0.07568359375, -0.052490234375, -0.029296875, -0.006103515625, 0.01708984375, 0.040283203125, 0.0634765625, 0.086669921875, 0.10986328125, 0.133056640625, 0.15625, 0.179443359375, 0.20263671875, 0.225830078125, 0.2490234375, 0.272216796875, 0.29541015625, 0.318603515625, 0.341796875, 0.364990234375, 0.38818359375, 0.411376953125, 0.4345703125, 0.457763671875, 0.48095703125, 0.504150390625, 0.52734375, 0.550537109375, 0.57373046875, 0.596923828125, 0.6201171875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 9.0, 18.0, 78.0, 240.0, 442.0, 147.0, 51.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.11605453491211, -11.13099193572998, -10.145928382873535, -9.160865783691406, -8.175802230834961, -7.190739631652832, -6.205677032470703, -5.220613956451416, -4.235550880432129, -3.250487804412842, -2.265424966812134, -1.2803621292114258, -0.29529905319213867, 0.6897640228271484, 1.6748266220092773, 2.6598896980285645, 3.6449527740478516, 4.630015850067139, 5.615078926086426, 6.600141525268555, 7.585204601287842, 8.570267677307129, 9.555330276489258, 10.540393829345703, 11.525456428527832, 12.510519027709961, 13.495582580566406, 14.480645179748535, 15.465707778930664, 16.45077133178711, 17.435832977294922, 18.420896530151367, 19.405960083007812, 20.391023635864258, 21.37608528137207, 22.361148834228516, 23.34621238708496, 24.331275939941406, 25.31633758544922, 26.301401138305664, 27.28646469116211, 28.271528244018555, 29.256589889526367, 30.241653442382812, 31.226716995239258, 32.2117805480957, 33.196842193603516, 34.18190383911133, 35.166969299316406, 36.15203094482422, 37.1370964050293, 38.12215805053711, 39.10721969604492, 40.09228515625, 41.07734680175781, 42.062408447265625, 43.04747009277344, 44.03253173828125, 45.01759719848633, 46.00265884399414, 46.98772048950195, 47.97278594970703, 48.957847595214844, 49.942909240722656, 50.927974700927734]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 19.0, 21.0, 32.0, 50.0, 61.0, 60.0, 80.0, 81.0, 89.0, 92.0, 76.0, 69.0, 60.0, 49.0, 38.0, 41.0, 23.0, 17.0, 9.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.135910034179688, -11.665919303894043, -11.195928573608398, -10.725937843322754, -10.25594711303711, -9.785955429077148, -9.315964698791504, -8.84597396850586, -8.375983238220215, -7.90599250793457, -7.436001777648926, -6.966010570526123, -6.4960198402404785, -6.026029109954834, -5.556037902832031, -5.086047172546387, -4.616056442260742, -4.146065711975098, -3.676074743270874, -3.2060837745666504, -2.736093044281006, -2.2661023139953613, -1.7961113452911377, -1.326120376586914, -0.8561296463012695, -0.38613879680633545, 0.08385205268859863, 0.5538429021835327, 1.0238337516784668, 1.4938244819641113, 1.963815450668335, 2.4338064193725586, 2.903797149658203, 3.3737878799438477, 3.8437788486480713, 4.313769817352295, 4.7837605476379395, 5.253751277923584, 5.723742485046387, 6.193733215332031, 6.663723945617676, 7.13371467590332, 7.603705406188965, 8.07369613647461, 8.54368782043457, 9.013677597045898, 9.48366928100586, 9.953660011291504, 10.423650741577148, 10.893641471862793, 11.363632202148438, 11.833622932434082, 12.303613662719727, 12.773605346679688, 13.243596076965332, 13.713586807250977, 14.183577537536621, 14.653568267822266, 15.12355899810791, 15.593549728393555, 16.063541412353516, 16.533531188964844, 17.003522872924805, 17.473514556884766, 17.943504333496094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 9.0, 11.0, 15.0, 14.0, 29.0, 22.0, 31.0, 23.0, 56.0, 70.0, 81.0, 124.0, 197.0, 265.0, 403.0, 658.0, 1189.0, 2189.0, 4750.0, 11641.0, 38283.0, 265997.0, 3679933.0, 142909.0, 27409.0, 9295.0, 3829.0, 1894.0, 1046.0, 623.0, 372.0, 255.0, 159.0, 140.0, 92.0, 78.0, 51.0, 40.0, 25.0, 23.0, 11.0, 4.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.19140625, -2.13116455078125, -2.0709228515625, -2.01068115234375, -1.950439453125, -1.89019775390625, -1.8299560546875, -1.76971435546875, -1.70947265625, -1.64923095703125, -1.5889892578125, -1.52874755859375, -1.468505859375, -1.40826416015625, -1.3480224609375, -1.28778076171875, -1.2275390625, -1.16729736328125, -1.1070556640625, -1.04681396484375, -0.986572265625, -0.92633056640625, -0.8660888671875, -0.80584716796875, -0.74560546875, -0.68536376953125, -0.6251220703125, -0.56488037109375, -0.504638671875, -0.44439697265625, -0.3841552734375, -0.32391357421875, -0.263671875, -0.20343017578125, -0.1431884765625, -0.08294677734375, -0.022705078125, 0.03753662109375, 0.0977783203125, 0.15802001953125, 0.21826171875, 0.27850341796875, 0.3387451171875, 0.39898681640625, 0.459228515625, 0.51947021484375, 0.5797119140625, 0.63995361328125, 0.7001953125, 0.76043701171875, 0.8206787109375, 0.88092041015625, 0.941162109375, 1.00140380859375, 1.0616455078125, 1.12188720703125, 1.18212890625, 1.24237060546875, 1.3026123046875, 1.36285400390625, 1.423095703125, 1.48333740234375, 1.5435791015625, 1.60382080078125, 1.6640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 4.0, 15.0, 15.0, 18.0, 25.0, 45.0, 39.0, 56.0, 78.0, 74.0, 100.0, 81.0, 79.0, 68.0, 63.0, 57.0, 46.0, 33.0, 22.0, 19.0, 14.0, 9.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4619140625, -0.449188232421875, -0.43646240234375, -0.423736572265625, -0.4110107421875, -0.398284912109375, -0.38555908203125, -0.372833251953125, -0.360107421875, -0.347381591796875, -0.33465576171875, -0.321929931640625, -0.3092041015625, -0.296478271484375, -0.28375244140625, -0.271026611328125, -0.25830078125, -0.245574951171875, -0.23284912109375, -0.220123291015625, -0.2073974609375, -0.194671630859375, -0.18194580078125, -0.169219970703125, -0.156494140625, -0.143768310546875, -0.13104248046875, -0.118316650390625, -0.1055908203125, -0.092864990234375, -0.08013916015625, -0.067413330078125, -0.0546875, -0.041961669921875, -0.02923583984375, -0.016510009765625, -0.0037841796875, 0.008941650390625, 0.02166748046875, 0.034393310546875, 0.047119140625, 0.059844970703125, 0.07257080078125, 0.085296630859375, 0.0980224609375, 0.110748291015625, 0.12347412109375, 0.136199951171875, 0.14892578125, 0.161651611328125, 0.17437744140625, 0.187103271484375, 0.1998291015625, 0.212554931640625, 0.22528076171875, 0.238006591796875, 0.250732421875, 0.263458251953125, 0.27618408203125, 0.288909912109375, 0.3016357421875, 0.314361572265625, 0.32708740234375, 0.339813232421875, 0.3525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 6.0, 33.0, 46.0, 64.0, 94.0, 168.0, 303.0, 606.0, 1537.0, 5002.0, 27148.0, 816624.0, 3294427.0, 38437.0, 6125.0, 1997.0, 788.0, 385.0, 211.0, 95.0, 58.0, 39.0, 22.0, 15.0, 8.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.359375, -2.26531982421875, -2.1712646484375, -2.07720947265625, -1.983154296875, -1.88909912109375, -1.7950439453125, -1.70098876953125, -1.60693359375, -1.51287841796875, -1.4188232421875, -1.32476806640625, -1.230712890625, -1.13665771484375, -1.0426025390625, -0.94854736328125, -0.8544921875, -0.76043701171875, -0.6663818359375, -0.57232666015625, -0.478271484375, -0.38421630859375, -0.2901611328125, -0.19610595703125, -0.10205078125, -0.00799560546875, 0.0860595703125, 0.18011474609375, 0.274169921875, 0.36822509765625, 0.4622802734375, 0.55633544921875, 0.650390625, 0.74444580078125, 0.8385009765625, 0.93255615234375, 1.026611328125, 1.12066650390625, 1.2147216796875, 1.30877685546875, 1.40283203125, 1.49688720703125, 1.5909423828125, 1.68499755859375, 1.779052734375, 1.87310791015625, 1.9671630859375, 2.06121826171875, 2.1552734375, 2.24932861328125, 2.3433837890625, 2.43743896484375, 2.531494140625, 2.62554931640625, 2.7196044921875, 2.81365966796875, 2.90771484375, 3.00177001953125, 3.0958251953125, 3.18988037109375, 3.283935546875, 3.37799072265625, 3.4720458984375, 3.56610107421875, 3.66015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 15.0, 30.0, 34.0, 44.0, 82.0, 164.0, 429.0, 2022.0, 739.0, 238.0, 95.0, 63.0, 28.0, 26.0, 15.0, 10.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.68994140625, -0.670623779296875, -0.65130615234375, -0.631988525390625, -0.6126708984375, -0.593353271484375, -0.57403564453125, -0.554718017578125, -0.535400390625, -0.516082763671875, -0.49676513671875, -0.477447509765625, -0.4581298828125, -0.438812255859375, -0.41949462890625, -0.400177001953125, -0.380859375, -0.361541748046875, -0.34222412109375, -0.322906494140625, -0.3035888671875, -0.284271240234375, -0.26495361328125, -0.245635986328125, -0.226318359375, -0.207000732421875, -0.18768310546875, -0.168365478515625, -0.1490478515625, -0.129730224609375, -0.11041259765625, -0.091094970703125, -0.07177734375, -0.052459716796875, -0.03314208984375, -0.013824462890625, 0.0054931640625, 0.024810791015625, 0.04412841796875, 0.063446044921875, 0.082763671875, 0.102081298828125, 0.12139892578125, 0.140716552734375, 0.1600341796875, 0.179351806640625, 0.19866943359375, 0.217987060546875, 0.2373046875, 0.256622314453125, 0.27593994140625, 0.295257568359375, 0.3145751953125, 0.333892822265625, 0.35321044921875, 0.372528076171875, 0.391845703125, 0.411163330078125, 0.43048095703125, 0.449798583984375, 0.4691162109375, 0.488433837890625, 0.50775146484375, 0.527069091796875, 0.54638671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 23.0, 35.0, 47.0, 86.0, 145.0, 187.0, 174.0, 119.0, 68.0, 49.0, 20.0, 23.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1480159759521484, -3.045922040939331, -2.9438281059265137, -2.8417341709136963, -2.739640235900879, -2.6375465393066406, -2.5354526042938232, -2.433358669281006, -2.3312647342681885, -2.229170799255371, -2.1270768642425537, -2.0249829292297363, -1.9228891134262085, -1.8207951784133911, -1.7187013626098633, -1.616607427597046, -1.5145134925842285, -1.4124195575714111, -1.3103256225585938, -1.208231806755066, -1.1061378717422485, -1.0040439367294312, -0.9019500613212585, -0.7998561859130859, -0.6977622509002686, -0.5956683158874512, -0.49357444047927856, -0.39148053526878357, -0.2893866300582886, -0.1872926950454712, -0.08519881963729858, 0.016895055770874023, 0.1189889907836914, 0.2210828959941864, 0.3231768012046814, 0.4252707064151764, 0.5273646116256714, 0.6294585466384888, 0.7315524220466614, 0.833646297454834, 0.9357402324676514, 1.0378341674804688, 1.1399281024932861, 1.242021918296814, 1.3441158533096313, 1.4462097883224487, 1.5483036041259766, 1.650397539138794, 1.7524914741516113, 1.8545854091644287, 1.956679344177246, 2.0587732791900635, 2.160867214202881, 2.262960910797119, 2.3650548458099365, 2.467148780822754, 2.5692427158355713, 2.6713366508483887, 2.773430585861206, 2.8755245208740234, 2.9776182174682617, 3.079712390899658, 3.1818060874938965, 3.283900022506714, 3.3859939575195312]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 9.0, 17.0, 17.0, 30.0, 39.0, 28.0, 39.0, 36.0, 47.0, 41.0, 40.0, 46.0, 68.0, 56.0, 51.0, 46.0, 49.0, 44.0, 35.0, 34.0, 35.0, 30.0, 18.0, 24.0, 18.0, 13.0, 15.0, 10.0, 9.0, 8.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5459598302841187, -1.4918259382247925, -1.4376921653747559, -1.3835582733154297, -1.3294243812561035, -1.275290608406067, -1.2211567163467407, -1.167022943496704, -1.112889051437378, -1.0587551593780518, -1.0046213865280151, -0.950487494468689, -0.8963536620140076, -0.8422198295593262, -0.7880859375, -0.7339521050453186, -0.6798182725906372, -0.6256844401359558, -0.5715506076812744, -0.5174167156219482, -0.46328288316726685, -0.40914905071258545, -0.35501518845558167, -0.3008813261985779, -0.24674749374389648, -0.1926136463880539, -0.1384797990322113, -0.08434595167636871, -0.030212104320526123, 0.023921728134155273, 0.07805559039115906, 0.13218945264816284, 0.1863234043121338, 0.24045725166797638, 0.29459109902381897, 0.34872496128082275, 0.40285879373550415, 0.45699262619018555, 0.5111265182495117, 0.5652603507041931, 0.6193941831588745, 0.6735280156135559, 0.7276618480682373, 0.7817957401275635, 0.8359295725822449, 0.8900634050369263, 0.9441972970962524, 0.9983311295509338, 1.0524649620056152, 1.1065988540649414, 1.160732626914978, 1.2148665189743042, 1.2690002918243408, 1.323134183883667, 1.3772680759429932, 1.4314019680023193, 1.485535740852356, 1.5396696329116821, 1.5938034057617188, 1.647937297821045, 1.702071189880371, 1.7562049627304077, 1.8103388547897339, 1.8644726276397705, 1.9186065196990967]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 11.0, 22.0, 30.0, 42.0, 56.0, 64.0, 132.0, 184.0, 291.0, 473.0, 867.0, 1504.0, 2831.0, 6262.0, 17450.0, 69233.0, 334411.0, 463733.0, 110032.0, 25040.0, 8135.0, 3417.0, 1749.0, 976.0, 568.0, 375.0, 219.0, 160.0, 102.0, 57.0, 42.0, 19.0, 11.0, 10.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.8974609375, -1.8345184326171875, -1.771575927734375, -1.7086334228515625, -1.64569091796875, -1.5827484130859375, -1.519805908203125, -1.4568634033203125, -1.3939208984375, -1.3309783935546875, -1.268035888671875, -1.2050933837890625, -1.14215087890625, -1.0792083740234375, -1.016265869140625, -0.9533233642578125, -0.890380859375, -0.8274383544921875, -0.764495849609375, -0.7015533447265625, -0.63861083984375, -0.5756683349609375, -0.512725830078125, -0.4497833251953125, -0.3868408203125, -0.3238983154296875, -0.260955810546875, -0.1980133056640625, -0.13507080078125, -0.0721282958984375, -0.009185791015625, 0.0537567138671875, 0.11669921875, 0.1796417236328125, 0.242584228515625, 0.3055267333984375, 0.36846923828125, 0.4314117431640625, 0.494354248046875, 0.5572967529296875, 0.6202392578125, 0.6831817626953125, 0.746124267578125, 0.8090667724609375, 0.87200927734375, 0.9349517822265625, 0.997894287109375, 1.0608367919921875, 1.123779296875, 1.1867218017578125, 1.249664306640625, 1.3126068115234375, 1.37554931640625, 1.4384918212890625, 1.501434326171875, 1.5643768310546875, 1.6273193359375, 1.6902618408203125, 1.753204345703125, 1.8161468505859375, 1.87908935546875, 1.9420318603515625, 2.004974365234375, 2.0679168701171875, 2.130859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 13.0, 9.0, 29.0, 27.0, 50.0, 52.0, 71.0, 92.0, 80.0, 91.0, 88.0, 86.0, 65.0, 59.0, 45.0, 38.0, 32.0, 16.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.497314453125, -0.4833412170410156, -0.46936798095703125, -0.4553947448730469, -0.4414215087890625, -0.4274482727050781, -0.41347503662109375, -0.3995018005371094, -0.385528564453125, -0.3715553283691406, -0.35758209228515625, -0.3436088562011719, -0.3296356201171875, -0.3156623840332031, -0.30168914794921875, -0.2877159118652344, -0.27374267578125, -0.2597694396972656, -0.24579620361328125, -0.23182296752929688, -0.2178497314453125, -0.20387649536132812, -0.18990325927734375, -0.17593002319335938, -0.161956787109375, -0.14798355102539062, -0.13401031494140625, -0.12003707885742188, -0.1060638427734375, -0.09209060668945312, -0.07811737060546875, -0.06414413452148438, -0.0501708984375, -0.036197662353515625, -0.02222442626953125, -0.008251190185546875, 0.0057220458984375, 0.019695281982421875, 0.03366851806640625, 0.047641754150390625, 0.061614990234375, 0.07558822631835938, 0.08956146240234375, 0.10353469848632812, 0.1175079345703125, 0.13148117065429688, 0.14545440673828125, 0.15942764282226562, 0.17340087890625, 0.18737411499023438, 0.20134735107421875, 0.21532058715820312, 0.2292938232421875, 0.24326705932617188, 0.25724029541015625, 0.2712135314941406, 0.285186767578125, 0.2991600036621094, 0.31313323974609375, 0.3271064758300781, 0.3410797119140625, 0.3550529479980469, 0.36902618408203125, 0.3829994201660156, 0.39697265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 10.0, 25.0, 32.0, 50.0, 55.0, 89.0, 128.0, 179.0, 319.0, 598.0, 1185.0, 2516.0, 6352.0, 19212.0, 75328.0, 366338.0, 442402.0, 96914.0, 23372.0, 7519.0, 2929.0, 1292.0, 631.0, 386.0, 243.0, 157.0, 97.0, 55.0, 30.0, 21.0, 26.0, 20.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7490234375, -1.6945037841796875, -1.639984130859375, -1.5854644775390625, -1.53094482421875, -1.4764251708984375, -1.421905517578125, -1.3673858642578125, -1.3128662109375, -1.2583465576171875, -1.203826904296875, -1.1493072509765625, -1.09478759765625, -1.0402679443359375, -0.985748291015625, -0.9312286376953125, -0.876708984375, -0.8221893310546875, -0.767669677734375, -0.7131500244140625, -0.65863037109375, -0.6041107177734375, -0.549591064453125, -0.4950714111328125, -0.4405517578125, -0.3860321044921875, -0.331512451171875, -0.2769927978515625, -0.22247314453125, -0.1679534912109375, -0.113433837890625, -0.0589141845703125, -0.00439453125, 0.0501251220703125, 0.104644775390625, 0.1591644287109375, 0.21368408203125, 0.2682037353515625, 0.322723388671875, 0.3772430419921875, 0.4317626953125, 0.4862823486328125, 0.540802001953125, 0.5953216552734375, 0.64984130859375, 0.7043609619140625, 0.758880615234375, 0.8134002685546875, 0.867919921875, 0.9224395751953125, 0.976959228515625, 1.0314788818359375, 1.08599853515625, 1.1405181884765625, 1.195037841796875, 1.2495574951171875, 1.3040771484375, 1.3585968017578125, 1.413116455078125, 1.4676361083984375, 1.52215576171875, 1.5766754150390625, 1.631195068359375, 1.6857147216796875, 1.740234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 5.0, 3.0, 6.0, 10.0, 12.0, 13.0, 27.0, 29.0, 36.0, 35.0, 46.0, 53.0, 62.0, 63.0, 63.0, 50.0, 61.0, 72.0, 55.0, 62.0, 37.0, 30.0, 35.0, 30.0, 21.0, 14.0, 12.0, 14.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.94140625, -1.8896026611328125, -1.837799072265625, -1.7859954833984375, -1.73419189453125, -1.6823883056640625, -1.630584716796875, -1.5787811279296875, -1.5269775390625, -1.4751739501953125, -1.423370361328125, -1.3715667724609375, -1.31976318359375, -1.2679595947265625, -1.216156005859375, -1.1643524169921875, -1.112548828125, -1.0607452392578125, -1.008941650390625, -0.9571380615234375, -0.90533447265625, -0.8535308837890625, -0.801727294921875, -0.7499237060546875, -0.6981201171875, -0.6463165283203125, -0.594512939453125, -0.5427093505859375, -0.49090576171875, -0.4391021728515625, -0.387298583984375, -0.3354949951171875, -0.28369140625, -0.2318878173828125, -0.180084228515625, -0.1282806396484375, -0.07647705078125, -0.0246734619140625, 0.027130126953125, 0.0789337158203125, 0.1307373046875, 0.1825408935546875, 0.234344482421875, 0.2861480712890625, 0.33795166015625, 0.3897552490234375, 0.441558837890625, 0.4933624267578125, 0.545166015625, 0.5969696044921875, 0.648773193359375, 0.7005767822265625, 0.75238037109375, 0.8041839599609375, 0.855987548828125, 0.9077911376953125, 0.9595947265625, 1.0113983154296875, 1.063201904296875, 1.1150054931640625, 1.16680908203125, 1.2186126708984375, 1.270416259765625, 1.3222198486328125, 1.3740234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 14.0, 27.0, 55.0, 93.0, 167.0, 308.0, 704.0, 1895.0, 6973.0, 48827.0, 671121.0, 291244.0, 20693.0, 4006.0, 1302.0, 514.0, 255.0, 139.0, 72.0, 54.0, 18.0, 13.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.05859375, -1.0281829833984375, -0.997772216796875, -0.9673614501953125, -0.93695068359375, -0.9065399169921875, -0.876129150390625, -0.8457183837890625, -0.8153076171875, -0.7848968505859375, -0.754486083984375, -0.7240753173828125, -0.69366455078125, -0.6632537841796875, -0.632843017578125, -0.6024322509765625, -0.572021484375, -0.5416107177734375, -0.511199951171875, -0.4807891845703125, -0.45037841796875, -0.4199676513671875, -0.389556884765625, -0.3591461181640625, -0.3287353515625, -0.2983245849609375, -0.267913818359375, -0.2375030517578125, -0.20709228515625, -0.1766815185546875, -0.146270751953125, -0.1158599853515625, -0.08544921875, -0.0550384521484375, -0.024627685546875, 0.0057830810546875, 0.03619384765625, 0.0666046142578125, 0.097015380859375, 0.1274261474609375, 0.1578369140625, 0.1882476806640625, 0.218658447265625, 0.2490692138671875, 0.27947998046875, 0.3098907470703125, 0.340301513671875, 0.3707122802734375, 0.401123046875, 0.4315338134765625, 0.461944580078125, 0.4923553466796875, 0.52276611328125, 0.5531768798828125, 0.583587646484375, 0.6139984130859375, 0.6444091796875, 0.6748199462890625, 0.705230712890625, 0.7356414794921875, 0.76605224609375, 0.7964630126953125, 0.826873779296875, 0.8572845458984375, 0.8876953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 11.0, 25.0, 23.0, 25.0, 41.0, 60.0, 72.0, 88.0, 98.0, 104.0, 96.0, 81.0, 65.0, 52.0, 44.0, 28.0, 19.0, 14.0, 7.0, 4.0, 12.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011944770812988281, -0.00011563487350940704, -0.00011182203888893127, -0.0001080092042684555, -0.00010419636964797974, -0.00010038353502750397, -9.65707004070282e-05, -9.275786578655243e-05, -8.894503116607666e-05, -8.513219654560089e-05, -8.131936192512512e-05, -7.750652730464935e-05, -7.369369268417358e-05, -6.988085806369781e-05, -6.606802344322205e-05, -6.225518882274628e-05, -5.844235420227051e-05, -5.462951958179474e-05, -5.081668496131897e-05, -4.70038503408432e-05, -4.319101572036743e-05, -3.937818109989166e-05, -3.5565346479415894e-05, -3.1752511858940125e-05, -2.7939677238464355e-05, -2.4126842617988586e-05, -2.0314007997512817e-05, -1.650117337703705e-05, -1.268833875656128e-05, -8.87550413608551e-06, -5.062669515609741e-06, -1.2498348951339722e-06, 2.562999725341797e-06, 6.375834345817566e-06, 1.0188668966293335e-05, 1.4001503586769104e-05, 1.7814338207244873e-05, 2.1627172827720642e-05, 2.544000744819641e-05, 2.925284206867218e-05, 3.306567668914795e-05, 3.687851130962372e-05, 4.069134593009949e-05, 4.4504180550575256e-05, 4.8317015171051025e-05, 5.2129849791526794e-05, 5.5942684412002563e-05, 5.975551903247833e-05, 6.35683536529541e-05, 6.738118827342987e-05, 7.119402289390564e-05, 7.500685751438141e-05, 7.881969213485718e-05, 8.263252675533295e-05, 8.644536137580872e-05, 9.025819599628448e-05, 9.407103061676025e-05, 9.788386523723602e-05, 0.00010169669985771179, 0.00010550953447818756, 0.00010932236909866333, 0.0001131352037191391, 0.00011694803833961487, 0.00012076087296009064, 0.0001245737075805664]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 12.0, 9.0, 23.0, 33.0, 70.0, 119.0, 268.0, 698.0, 2157.0, 10511.0, 143935.0, 810995.0, 70055.0, 7029.0, 1591.0, 575.0, 252.0, 95.0, 45.0, 28.0, 24.0, 11.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.4041595458984375, -1.371795654296875, -1.3394317626953125, -1.30706787109375, -1.2747039794921875, -1.242340087890625, -1.2099761962890625, -1.1776123046875, -1.1452484130859375, -1.112884521484375, -1.0805206298828125, -1.04815673828125, -1.0157928466796875, -0.983428955078125, -0.9510650634765625, -0.918701171875, -0.8863372802734375, -0.853973388671875, -0.8216094970703125, -0.78924560546875, -0.7568817138671875, -0.724517822265625, -0.6921539306640625, -0.6597900390625, -0.6274261474609375, -0.595062255859375, -0.5626983642578125, -0.53033447265625, -0.4979705810546875, -0.465606689453125, -0.4332427978515625, -0.40087890625, -0.3685150146484375, -0.336151123046875, -0.3037872314453125, -0.27142333984375, -0.2390594482421875, -0.206695556640625, -0.1743316650390625, -0.1419677734375, -0.1096038818359375, -0.077239990234375, -0.0448760986328125, -0.01251220703125, 0.0198516845703125, 0.052215576171875, 0.0845794677734375, 0.116943359375, 0.1493072509765625, 0.181671142578125, 0.2140350341796875, 0.24639892578125, 0.2787628173828125, 0.311126708984375, 0.3434906005859375, 0.3758544921875, 0.4082183837890625, 0.440582275390625, 0.4729461669921875, 0.50531005859375, 0.5376739501953125, 0.570037841796875, 0.6024017333984375, 0.634765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 8.0, 10.0, 21.0, 19.0, 47.0, 31.0, 68.0, 92.0, 110.0, 122.0, 137.0, 97.0, 65.0, 56.0, 44.0, 23.0, 13.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7294921875, -0.7124176025390625, -0.695343017578125, -0.6782684326171875, -0.66119384765625, -0.6441192626953125, -0.627044677734375, -0.6099700927734375, -0.5928955078125, -0.5758209228515625, -0.558746337890625, -0.5416717529296875, -0.52459716796875, -0.5075225830078125, -0.490447998046875, -0.4733734130859375, -0.456298828125, -0.4392242431640625, -0.422149658203125, -0.4050750732421875, -0.38800048828125, -0.3709259033203125, -0.353851318359375, -0.3367767333984375, -0.3197021484375, -0.3026275634765625, -0.285552978515625, -0.2684783935546875, -0.25140380859375, -0.2343292236328125, -0.217254638671875, -0.2001800537109375, -0.18310546875, -0.1660308837890625, -0.148956298828125, -0.1318817138671875, -0.11480712890625, -0.0977325439453125, -0.080657958984375, -0.0635833740234375, -0.0465087890625, -0.0294342041015625, -0.012359619140625, 0.0047149658203125, 0.02178955078125, 0.0388641357421875, 0.055938720703125, 0.0730133056640625, 0.090087890625, 0.1071624755859375, 0.124237060546875, 0.1413116455078125, 0.15838623046875, 0.1754608154296875, 0.192535400390625, 0.2096099853515625, 0.2266845703125, 0.2437591552734375, 0.260833740234375, 0.2779083251953125, 0.29498291015625, 0.3120574951171875, 0.329132080078125, 0.3462066650390625, 0.36328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 11.0, 5.0, 7.0, 16.0, 20.0, 34.0, 47.0, 81.0, 120.0, 162.0, 158.0, 126.0, 69.0, 53.0, 39.0, 18.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.183361053466797, -11.862210273742676, -11.541058540344238, -11.219907760620117, -10.898756980895996, -10.577606201171875, -10.256454467773438, -9.935303688049316, -9.614152908325195, -9.293002128601074, -8.971850395202637, -8.650699615478516, -8.329548835754395, -8.008398056030273, -7.687246322631836, -7.366095542907715, -7.044943809509277, -6.723792552947998, -6.402641773223877, -6.081490516662598, -5.760339736938477, -5.439188480377197, -5.118037223815918, -4.796886444091797, -4.475735187530518, -4.154583930969238, -3.833433151245117, -3.512281894683838, -3.1911308765411377, -2.8699798583984375, -2.548828601837158, -2.227677583694458, -1.9065256118774414, -1.5853745937347412, -1.2642234563827515, -0.9430723786354065, -0.6219213008880615, -0.30077028274536133, 0.020380854606628418, 0.34153199195861816, 0.6626830101013184, 0.9838340878486633, 1.3049851655960083, 1.626136302947998, 1.9472873210906982, 2.2684383392333984, 2.5895895957946777, 2.910740613937378, 3.231891632080078, 3.5530426502227783, 3.8741936683654785, 4.195344924926758, 4.516495704650879, 4.837646961212158, 5.1587982177734375, 5.479948997497559, 5.801100254058838, 6.122251510620117, 6.443402290344238, 6.764553546905518, 7.085704803466797, 7.406855583190918, 7.728006839752197, 8.049158096313477, 8.370308876037598]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 5.0, 12.0, 15.0, 21.0, 25.0, 25.0, 47.0, 43.0, 65.0, 51.0, 59.0, 85.0, 79.0, 75.0, 84.0, 67.0, 54.0, 30.0, 36.0, 26.0, 32.0, 13.0, 14.0, 15.0, 2.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.267683029174805, -15.89025592803955, -15.51282787322998, -15.135400772094727, -14.757972717285156, -14.380545616149902, -14.003117561340332, -13.625690460205078, -13.248262405395508, -12.870835304260254, -12.493407249450684, -12.11598014831543, -11.73855209350586, -11.361124992370605, -10.983696937561035, -10.606269836425781, -10.228841781616211, -9.851414680480957, -9.473986625671387, -9.096559524536133, -8.719131469726562, -8.341704368591309, -7.964276313781738, -7.586849212646484, -7.2094221115112305, -6.831994533538818, -6.454566955566406, -6.077139377593994, -5.699711799621582, -5.32228422164917, -4.944856643676758, -4.567429542541504, -4.190001487731934, -3.8125739097595215, -3.4351463317871094, -3.0577187538146973, -2.680291175842285, -2.302863597869873, -1.92543625831604, -1.548008680343628, -1.1705811023712158, -0.7931535243988037, -0.4157260060310364, -0.03829848766326904, 0.33912909030914307, 0.7165566682815552, 1.0939841270446777, 1.4714117050170898, 1.848839282989502, 2.226266860961914, 2.603694438934326, 2.9811220169067383, 3.3585495948791504, 3.7359771728515625, 4.113404273986816, 4.490832328796387, 4.868259429931641, 5.245687007904053, 5.623114585876465, 6.000542163848877, 6.377969741821289, 6.755397319793701, 7.132824897766113, 7.510251998901367, 7.8876800537109375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 10.0, 15.0, 17.0, 20.0, 28.0, 27.0, 44.0, 39.0, 55.0, 66.0, 106.0, 122.0, 196.0, 262.0, 365.0, 586.0, 1003.0, 1834.0, 3794.0, 8953.0, 27618.0, 151565.0, 3674503.0, 265498.0, 36975.0, 11083.0, 4393.0, 2130.0, 1082.0, 636.0, 430.0, 245.0, 160.0, 108.0, 74.0, 61.0, 37.0, 31.0, 22.0, 22.0, 22.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.4140625, -2.34222412109375, -2.2703857421875, -2.19854736328125, -2.126708984375, -2.05487060546875, -1.9830322265625, -1.91119384765625, -1.83935546875, -1.76751708984375, -1.6956787109375, -1.62384033203125, -1.552001953125, -1.48016357421875, -1.4083251953125, -1.33648681640625, -1.2646484375, -1.19281005859375, -1.1209716796875, -1.04913330078125, -0.977294921875, -0.90545654296875, -0.8336181640625, -0.76177978515625, -0.68994140625, -0.61810302734375, -0.5462646484375, -0.47442626953125, -0.402587890625, -0.33074951171875, -0.2589111328125, -0.18707275390625, -0.115234375, -0.04339599609375, 0.0284423828125, 0.10028076171875, 0.172119140625, 0.24395751953125, 0.3157958984375, 0.38763427734375, 0.45947265625, 0.53131103515625, 0.6031494140625, 0.67498779296875, 0.746826171875, 0.81866455078125, 0.8905029296875, 0.96234130859375, 1.0341796875, 1.10601806640625, 1.1778564453125, 1.24969482421875, 1.321533203125, 1.39337158203125, 1.4652099609375, 1.53704833984375, 1.60888671875, 1.68072509765625, 1.7525634765625, 1.82440185546875, 1.896240234375, 1.96807861328125, 2.0399169921875, 2.11175537109375, 2.18359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 12.0, 18.0, 20.0, 31.0, 53.0, 56.0, 71.0, 88.0, 94.0, 91.0, 89.0, 69.0, 77.0, 51.0, 46.0, 39.0, 30.0, 17.0, 10.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.47998046875, -0.466064453125, -0.4521484375, -0.438232421875, -0.42431640625, -0.410400390625, -0.396484375, -0.382568359375, -0.36865234375, -0.354736328125, -0.3408203125, -0.326904296875, -0.31298828125, -0.299072265625, -0.28515625, -0.271240234375, -0.25732421875, -0.243408203125, -0.2294921875, -0.215576171875, -0.20166015625, -0.187744140625, -0.173828125, -0.159912109375, -0.14599609375, -0.132080078125, -0.1181640625, -0.104248046875, -0.09033203125, -0.076416015625, -0.0625, -0.048583984375, -0.03466796875, -0.020751953125, -0.0068359375, 0.007080078125, 0.02099609375, 0.034912109375, 0.048828125, 0.062744140625, 0.07666015625, 0.090576171875, 0.1044921875, 0.118408203125, 0.13232421875, 0.146240234375, 0.16015625, 0.174072265625, 0.18798828125, 0.201904296875, 0.2158203125, 0.229736328125, 0.24365234375, 0.257568359375, 0.271484375, 0.285400390625, 0.29931640625, 0.313232421875, 0.3271484375, 0.341064453125, 0.35498046875, 0.368896484375, 0.3828125, 0.396728515625, 0.41064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 7.0, 18.0, 46.0, 78.0, 112.0, 234.0, 507.0, 1160.0, 2944.0, 8940.0, 48239.0, 3818852.0, 286479.0, 18504.0, 4893.0, 1762.0, 715.0, 337.0, 172.0, 99.0, 59.0, 30.0, 27.0, 11.0, 13.0, 8.0, 6.0, 8.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8984375, -2.7813720703125, -2.664306640625, -2.5472412109375, -2.43017578125, -2.3131103515625, -2.196044921875, -2.0789794921875, -1.9619140625, -1.8448486328125, -1.727783203125, -1.6107177734375, -1.49365234375, -1.3765869140625, -1.259521484375, -1.1424560546875, -1.025390625, -0.9083251953125, -0.791259765625, -0.6741943359375, -0.55712890625, -0.4400634765625, -0.322998046875, -0.2059326171875, -0.0888671875, 0.0281982421875, 0.145263671875, 0.2623291015625, 0.37939453125, 0.4964599609375, 0.613525390625, 0.7305908203125, 0.84765625, 0.9647216796875, 1.081787109375, 1.1988525390625, 1.31591796875, 1.4329833984375, 1.550048828125, 1.6671142578125, 1.7841796875, 1.9012451171875, 2.018310546875, 2.1353759765625, 2.25244140625, 2.3695068359375, 2.486572265625, 2.6036376953125, 2.720703125, 2.8377685546875, 2.954833984375, 3.0718994140625, 3.18896484375, 3.3060302734375, 3.423095703125, 3.5401611328125, 3.6572265625, 3.7742919921875, 3.891357421875, 4.0084228515625, 4.12548828125, 4.2425537109375, 4.359619140625, 4.4766845703125, 4.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 6.0, 7.0, 17.0, 17.0, 29.0, 76.0, 127.0, 368.0, 2040.0, 932.0, 244.0, 85.0, 44.0, 27.0, 11.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9921875, -0.9521484375, -0.912109375, -0.8720703125, -0.83203125, -0.7919921875, -0.751953125, -0.7119140625, -0.671875, -0.6318359375, -0.591796875, -0.5517578125, -0.51171875, -0.4716796875, -0.431640625, -0.3916015625, -0.3515625, -0.3115234375, -0.271484375, -0.2314453125, -0.19140625, -0.1513671875, -0.111328125, -0.0712890625, -0.03125, 0.0087890625, 0.048828125, 0.0888671875, 0.12890625, 0.1689453125, 0.208984375, 0.2490234375, 0.2890625, 0.3291015625, 0.369140625, 0.4091796875, 0.44921875, 0.4892578125, 0.529296875, 0.5693359375, 0.609375, 0.6494140625, 0.689453125, 0.7294921875, 0.76953125, 0.8095703125, 0.849609375, 0.8896484375, 0.9296875, 0.9697265625, 1.009765625, 1.0498046875, 1.08984375, 1.1298828125, 1.169921875, 1.2099609375, 1.25, 1.2900390625, 1.330078125, 1.3701171875, 1.41015625, 1.4501953125, 1.490234375, 1.5302734375, 1.5703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 35.0, 143.0, 305.0, 305.0, 125.0, 42.0, 17.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.918496131896973, -13.593974113464355, -13.269453048706055, -12.944931030273438, -12.62040901184082, -12.29588794708252, -11.971365928649902, -11.646844863891602, -11.322322845458984, -10.997800827026367, -10.673279762268066, -10.34875774383545, -10.024236679077148, -9.699714660644531, -9.375192642211914, -9.050670623779297, -8.726149559020996, -8.401627540588379, -8.077106475830078, -7.752584457397461, -7.428062915802002, -7.103541374206543, -6.779019355773926, -6.454497814178467, -6.129976272583008, -5.805454730987549, -5.48093318939209, -5.156411170959473, -4.831889629364014, -4.507368087768555, -4.1828460693359375, -3.8583245277404785, -3.5338029861450195, -3.2092814445495605, -2.8847596645355225, -2.5602378845214844, -2.2357163429260254, -1.9111946821212769, -1.5866730213165283, -1.2621512413024902, -0.9376296997070312, -0.6131080389022827, -0.2885863780975342, 0.035935282707214355, 0.3604569435119629, 0.6849786043167114, 1.00950026512146, 1.334022045135498, 1.658543586730957, 1.9830652475357056, 2.307586908340454, 2.632108688354492, 2.956630229949951, 3.28115177154541, 3.6056735515594482, 3.9301953315734863, 4.254716873168945, 4.579238414764404, 4.903759956359863, 5.2282819747924805, 5.5528035163879395, 5.877325057983398, 6.201847076416016, 6.526368618011475, 6.850890159606934]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 11.0, 8.0, 8.0, 9.0, 25.0, 25.0, 34.0, 38.0, 57.0, 55.0, 67.0, 63.0, 94.0, 73.0, 80.0, 79.0, 62.0, 52.0, 38.0, 40.0, 28.0, 21.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.513881683349609, -4.385019302368164, -4.256156921386719, -4.127294063568115, -3.99843168258667, -3.8695693016052246, -3.7407069206237793, -3.611844539642334, -3.4829819202423096, -3.3541195392608643, -3.22525691986084, -3.0963945388793945, -2.967532157897949, -2.838669538497925, -2.7098071575164795, -2.580944538116455, -2.4520821571350098, -2.3232197761535645, -2.19435715675354, -2.0654947757720947, -1.9366322755813599, -1.807769775390625, -1.6789073944091797, -1.5500448942184448, -1.42118239402771, -1.292319893836975, -1.1634573936462402, -1.034595012664795, -0.9057325124740601, -0.7768700122833252, -0.6480075716972351, -0.519145131111145, -0.39028310775756836, -0.2614206373691559, -0.1325581669807434, -0.0036956965923309326, 0.12516677379608154, 0.2540292739868164, 0.3828917145729065, 0.5117541551589966, 0.6406166553497314, 0.7694791555404663, 0.8983415961265564, 1.0272040367126465, 1.1560665369033813, 1.2849290370941162, 1.4137914180755615, 1.5426539182662964, 1.6715164184570312, 1.8003789186477661, 1.929241418838501, 2.0581037998199463, 2.1869664192199707, 2.315828800201416, 2.4446911811828613, 2.5735535621643066, 2.702416181564331, 2.8312785625457764, 2.960141181945801, 3.089003562927246, 3.2178659439086914, 3.346728563308716, 3.475590944290161, 3.6044535636901855, 3.733315944671631]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 4.0, 9.0, 5.0, 13.0, 15.0, 19.0, 25.0, 28.0, 49.0, 50.0, 78.0, 97.0, 145.0, 215.0, 268.0, 394.0, 572.0, 800.0, 1341.0, 2155.0, 4026.0, 9110.0, 29719.0, 147955.0, 547188.0, 236848.0, 43495.0, 11920.0, 4794.0, 2552.0, 1566.0, 945.0, 659.0, 425.0, 288.0, 201.0, 161.0, 99.0, 78.0, 57.0, 42.0, 34.0, 18.0, 23.0, 11.0, 18.0, 9.0, 5.0, 8.0, 7.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.9375, -1.8781280517578125, -1.818756103515625, -1.7593841552734375, -1.70001220703125, -1.6406402587890625, -1.581268310546875, -1.5218963623046875, -1.4625244140625, -1.4031524658203125, -1.343780517578125, -1.2844085693359375, -1.22503662109375, -1.1656646728515625, -1.106292724609375, -1.0469207763671875, -0.987548828125, -0.9281768798828125, -0.868804931640625, -0.8094329833984375, -0.75006103515625, -0.6906890869140625, -0.631317138671875, -0.5719451904296875, -0.5125732421875, -0.4532012939453125, -0.393829345703125, -0.3344573974609375, -0.27508544921875, -0.2157135009765625, -0.156341552734375, -0.0969696044921875, -0.03759765625, 0.0217742919921875, 0.081146240234375, 0.1405181884765625, 0.19989013671875, 0.2592620849609375, 0.318634033203125, 0.3780059814453125, 0.4373779296875, 0.4967498779296875, 0.556121826171875, 0.6154937744140625, 0.67486572265625, 0.7342376708984375, 0.793609619140625, 0.8529815673828125, 0.912353515625, 0.9717254638671875, 1.031097412109375, 1.0904693603515625, 1.14984130859375, 1.2092132568359375, 1.268585205078125, 1.3279571533203125, 1.3873291015625, 1.4467010498046875, 1.506072998046875, 1.5654449462890625, 1.62481689453125, 1.6841888427734375, 1.743560791015625, 1.8029327392578125, 1.8623046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 9.0, 14.0, 18.0, 35.0, 45.0, 70.0, 95.0, 104.0, 139.0, 100.0, 109.0, 88.0, 53.0, 38.0, 25.0, 14.0, 17.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6025390625, -0.5846481323242188, -0.5667572021484375, -0.5488662719726562, -0.530975341796875, -0.5130844116210938, -0.4951934814453125, -0.47730255126953125, -0.45941162109375, -0.44152069091796875, -0.4236297607421875, -0.40573883056640625, -0.387847900390625, -0.36995697021484375, -0.3520660400390625, -0.33417510986328125, -0.3162841796875, -0.29839324951171875, -0.2805023193359375, -0.26261138916015625, -0.244720458984375, -0.22682952880859375, -0.2089385986328125, -0.19104766845703125, -0.17315673828125, -0.15526580810546875, -0.1373748779296875, -0.11948394775390625, -0.101593017578125, -0.08370208740234375, -0.0658111572265625, -0.04792022705078125, -0.030029296875, -0.01213836669921875, 0.0057525634765625, 0.02364349365234375, 0.041534423828125, 0.05942535400390625, 0.0773162841796875, 0.09520721435546875, 0.11309814453125, 0.13098907470703125, 0.1488800048828125, 0.16677093505859375, 0.184661865234375, 0.20255279541015625, 0.2204437255859375, 0.23833465576171875, 0.2562255859375, 0.27411651611328125, 0.2920074462890625, 0.30989837646484375, 0.327789306640625, 0.34568023681640625, 0.3635711669921875, 0.38146209716796875, 0.39935302734375, 0.41724395751953125, 0.4351348876953125, 0.45302581787109375, 0.470916748046875, 0.48880767822265625, 0.5066986083984375, 0.5245895385742188, 0.54248046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 14.0, 15.0, 17.0, 29.0, 43.0, 57.0, 80.0, 91.0, 178.0, 289.0, 465.0, 853.0, 1622.0, 3329.0, 7738.0, 20960.0, 64275.0, 204074.0, 407638.0, 225997.0, 71943.0, 23205.0, 8342.0, 3452.0, 1580.0, 818.0, 460.0, 343.0, 197.0, 115.0, 75.0, 59.0, 56.0, 27.0, 30.0, 13.0, 14.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.0478515625, -1.015655517578125, -0.98345947265625, -0.951263427734375, -0.9190673828125, -0.886871337890625, -0.85467529296875, -0.822479248046875, -0.790283203125, -0.758087158203125, -0.72589111328125, -0.693695068359375, -0.6614990234375, -0.629302978515625, -0.59710693359375, -0.564910888671875, -0.53271484375, -0.500518798828125, -0.46832275390625, -0.436126708984375, -0.4039306640625, -0.371734619140625, -0.33953857421875, -0.307342529296875, -0.275146484375, -0.242950439453125, -0.21075439453125, -0.178558349609375, -0.1463623046875, -0.114166259765625, -0.08197021484375, -0.049774169921875, -0.017578125, 0.014617919921875, 0.04681396484375, 0.079010009765625, 0.1112060546875, 0.143402099609375, 0.17559814453125, 0.207794189453125, 0.239990234375, 0.272186279296875, 0.30438232421875, 0.336578369140625, 0.3687744140625, 0.400970458984375, 0.43316650390625, 0.465362548828125, 0.49755859375, 0.529754638671875, 0.56195068359375, 0.594146728515625, 0.6263427734375, 0.658538818359375, 0.69073486328125, 0.722930908203125, 0.755126953125, 0.787322998046875, 0.81951904296875, 0.851715087890625, 0.8839111328125, 0.916107177734375, 0.94830322265625, 0.980499267578125, 1.0126953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 11.0, 10.0, 20.0, 24.0, 33.0, 35.0, 35.0, 44.0, 44.0, 39.0, 45.0, 49.0, 49.0, 52.0, 50.0, 47.0, 47.0, 39.0, 26.0, 41.0, 42.0, 40.0, 25.0, 28.0, 20.0, 18.0, 20.0, 14.0, 8.0, 8.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.07421875, -1.0384674072265625, -1.002716064453125, -0.9669647216796875, -0.93121337890625, -0.8954620361328125, -0.859710693359375, -0.8239593505859375, -0.7882080078125, -0.7524566650390625, -0.716705322265625, -0.6809539794921875, -0.64520263671875, -0.6094512939453125, -0.573699951171875, -0.5379486083984375, -0.502197265625, -0.4664459228515625, -0.430694580078125, -0.3949432373046875, -0.35919189453125, -0.3234405517578125, -0.287689208984375, -0.2519378662109375, -0.2161865234375, -0.1804351806640625, -0.144683837890625, -0.1089324951171875, -0.07318115234375, -0.0374298095703125, -0.001678466796875, 0.0340728759765625, 0.06982421875, 0.1055755615234375, 0.141326904296875, 0.1770782470703125, 0.21282958984375, 0.2485809326171875, 0.284332275390625, 0.3200836181640625, 0.3558349609375, 0.3915863037109375, 0.427337646484375, 0.4630889892578125, 0.49884033203125, 0.5345916748046875, 0.570343017578125, 0.6060943603515625, 0.641845703125, 0.6775970458984375, 0.713348388671875, 0.7490997314453125, 0.78485107421875, 0.8206024169921875, 0.856353759765625, 0.8921051025390625, 0.9278564453125, 0.9636077880859375, 0.999359130859375, 1.0351104736328125, 1.07086181640625, 1.1066131591796875, 1.142364501953125, 1.1781158447265625, 1.2138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 12.0, 9.0, 20.0, 25.0, 36.0, 79.0, 140.0, 286.0, 689.0, 2442.0, 14629.0, 336289.0, 660035.0, 28585.0, 3648.0, 928.0, 324.0, 143.0, 84.0, 48.0, 47.0, 23.0, 16.0, 10.0, 5.0, 1.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3769760131835938, -1.3408660888671875, -1.3047561645507812, -1.268646240234375, -1.2325363159179688, -1.1964263916015625, -1.1603164672851562, -1.12420654296875, -1.0880966186523438, -1.0519866943359375, -1.0158767700195312, -0.979766845703125, -0.9436569213867188, -0.9075469970703125, -0.8714370727539062, -0.8353271484375, -0.7992172241210938, -0.7631072998046875, -0.7269973754882812, -0.690887451171875, -0.6547775268554688, -0.6186676025390625, -0.5825576782226562, -0.54644775390625, -0.5103378295898438, -0.4742279052734375, -0.43811798095703125, -0.402008056640625, -0.36589813232421875, -0.3297882080078125, -0.29367828369140625, -0.257568359375, -0.22145843505859375, -0.1853485107421875, -0.14923858642578125, -0.113128662109375, -0.07701873779296875, -0.0409088134765625, -0.00479888916015625, 0.03131103515625, 0.06742095947265625, 0.1035308837890625, 0.13964080810546875, 0.175750732421875, 0.21186065673828125, 0.2479705810546875, 0.28408050537109375, 0.3201904296875, 0.35630035400390625, 0.3924102783203125, 0.42852020263671875, 0.464630126953125, 0.5007400512695312, 0.5368499755859375, 0.5729598999023438, 0.60906982421875, 0.6451797485351562, 0.6812896728515625, 0.7173995971679688, 0.753509521484375, 0.7896194458007812, 0.8257293701171875, 0.8618392944335938, 0.89794921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 19.0, 25.0, 22.0, 48.0, 72.0, 151.0, 186.0, 185.0, 124.0, 79.0, 45.0, 27.0, 13.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00029659271240234375, -0.0002903798595070839, -0.00028416700661182404, -0.0002779541537165642, -0.0002717413008213043, -0.00026552844792604446, -0.0002593155950307846, -0.00025310274213552475, -0.0002468898892402649, -0.00024067703634500504, -0.00023446418344974518, -0.00022825133055448532, -0.00022203847765922546, -0.0002158256247639656, -0.00020961277186870575, -0.0002033999189734459, -0.00019718706607818604, -0.00019097421318292618, -0.00018476136028766632, -0.00017854850739240646, -0.0001723356544971466, -0.00016612280160188675, -0.0001599099487066269, -0.00015369709581136703, -0.00014748424291610718, -0.00014127139002084732, -0.00013505853712558746, -0.0001288456842303276, -0.00012263283133506775, -0.00011641997843980789, -0.00011020712554454803, -0.00010399427264928818, -9.778141975402832e-05, -9.156856685876846e-05, -8.53557139635086e-05, -7.914286106824875e-05, -7.293000817298889e-05, -6.671715527772903e-05, -6.050430238246918e-05, -5.429144948720932e-05, -4.807859659194946e-05, -4.1865743696689606e-05, -3.565289080142975e-05, -2.944003790616989e-05, -2.3227185010910034e-05, -1.7014332115650177e-05, -1.080147922039032e-05, -4.588626325130463e-06, 1.6242265701293945e-06, 7.837079465389252e-06, 1.4049932360649109e-05, 2.0262785255908966e-05, 2.6475638151168823e-05, 3.268849104642868e-05, 3.890134394168854e-05, 4.5114196836948395e-05, 5.132704973220825e-05, 5.753990262746811e-05, 6.375275552272797e-05, 6.996560841798782e-05, 7.617846131324768e-05, 8.239131420850754e-05, 8.86041671037674e-05, 9.481701999902725e-05, 0.00010102987289428711]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 10.0, 11.0, 18.0, 18.0, 34.0, 64.0, 122.0, 178.0, 432.0, 877.0, 2112.0, 6519.0, 27920.0, 183318.0, 594887.0, 192797.0, 28529.0, 6717.0, 2236.0, 844.0, 421.0, 223.0, 97.0, 59.0, 38.0, 25.0, 17.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5064926147460938, -0.4880828857421875, -0.46967315673828125, -0.451263427734375, -0.43285369873046875, -0.4144439697265625, -0.39603424072265625, -0.37762451171875, -0.35921478271484375, -0.3408050537109375, -0.32239532470703125, -0.303985595703125, -0.28557586669921875, -0.2671661376953125, -0.24875640869140625, -0.2303466796875, -0.21193695068359375, -0.1935272216796875, -0.17511749267578125, -0.156707763671875, -0.13829803466796875, -0.1198883056640625, -0.10147857666015625, -0.08306884765625, -0.06465911865234375, -0.0462493896484375, -0.02783966064453125, -0.009429931640625, 0.00897979736328125, 0.0273895263671875, 0.04579925537109375, 0.064208984375, 0.08261871337890625, 0.1010284423828125, 0.11943817138671875, 0.137847900390625, 0.15625762939453125, 0.1746673583984375, 0.19307708740234375, 0.21148681640625, 0.22989654541015625, 0.2483062744140625, 0.26671600341796875, 0.285125732421875, 0.30353546142578125, 0.3219451904296875, 0.34035491943359375, 0.3587646484375, 0.37717437744140625, 0.3955841064453125, 0.41399383544921875, 0.432403564453125, 0.45081329345703125, 0.4692230224609375, 0.48763275146484375, 0.50604248046875, 0.5244522094726562, 0.5428619384765625, 0.5612716674804688, 0.579681396484375, 0.5980911254882812, 0.6165008544921875, 0.6349105834960938, 0.6533203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 8.0, 19.0, 16.0, 22.0, 34.0, 40.0, 59.0, 64.0, 79.0, 105.0, 78.0, 87.0, 75.0, 64.0, 66.0, 33.0, 41.0, 25.0, 21.0, 16.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.34468841552734375, -0.3300018310546875, -0.31531524658203125, -0.300628662109375, -0.28594207763671875, -0.2712554931640625, -0.25656890869140625, -0.24188232421875, -0.22719573974609375, -0.2125091552734375, -0.19782257080078125, -0.183135986328125, -0.16844940185546875, -0.1537628173828125, -0.13907623291015625, -0.1243896484375, -0.10970306396484375, -0.0950164794921875, -0.08032989501953125, -0.065643310546875, -0.05095672607421875, -0.0362701416015625, -0.02158355712890625, -0.00689697265625, 0.00778961181640625, 0.0224761962890625, 0.03716278076171875, 0.051849365234375, 0.06653594970703125, 0.0812225341796875, 0.09590911865234375, 0.110595703125, 0.12528228759765625, 0.1399688720703125, 0.15465545654296875, 0.169342041015625, 0.18402862548828125, 0.1987152099609375, 0.21340179443359375, 0.22808837890625, 0.24277496337890625, 0.2574615478515625, 0.27214813232421875, 0.286834716796875, 0.30152130126953125, 0.3162078857421875, 0.33089447021484375, 0.3455810546875, 0.36026763916015625, 0.3749542236328125, 0.38964080810546875, 0.404327392578125, 0.41901397705078125, 0.4337005615234375, 0.44838714599609375, 0.46307373046875, 0.47776031494140625, 0.4924468994140625, 0.5071334838867188, 0.521820068359375, 0.5365066528320312, 0.5511932373046875, 0.5658798217773438, 0.58056640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 14.0, 26.0, 68.0, 129.0, 227.0, 242.0, 156.0, 58.0, 45.0, 21.0, 7.0, 3.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.999469757080078, -18.576515197753906, -18.153560638427734, -17.730607986450195, -17.307653427124023, -16.88469886779785, -16.46174430847168, -16.03879165649414, -15.615837097167969, -15.192882537841797, -14.769928932189941, -14.34697437286377, -13.924020767211914, -13.501066207885742, -13.07811164855957, -12.655158042907715, -12.232203483581543, -11.809248924255371, -11.386295318603516, -10.963340759277344, -10.540387153625488, -10.117432594299316, -9.694478988647461, -9.271524429321289, -8.848569869995117, -8.425615310668945, -8.00266170501709, -7.579707145690918, -7.1567535400390625, -6.733798980712891, -6.310844898223877, -5.887890815734863, -5.464937210083008, -5.041983127593994, -4.6190290451049805, -4.196074485778809, -3.773120641708374, -3.3501665592193604, -2.9272122383117676, -2.504258155822754, -2.0813040733337402, -1.6583499908447266, -1.2353957891464233, -0.8124415874481201, -0.38948750495910645, 0.03346657752990723, 0.4564208984375, 0.8793749809265137, 1.3023290634155273, 1.725283145904541, 2.1482372283935547, 2.5711915493011475, 2.994145631790161, 3.417099714279175, 3.8400540351867676, 4.263008117675781, 4.685962200164795, 5.108916282653809, 5.531870365142822, 5.954824447631836, 6.377779006958008, 6.800732612609863, 7.223687171936035, 7.646641254425049, 8.069595336914062]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 8.0, 21.0, 15.0, 22.0, 20.0, 26.0, 31.0, 37.0, 31.0, 46.0, 51.0, 52.0, 69.0, 64.0, 67.0, 57.0, 46.0, 60.0, 47.0, 33.0, 43.0, 35.0, 30.0, 19.0, 20.0, 8.0, 14.0, 14.0, 3.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.585875034332275, -7.340003490447998, -7.094131946563721, -6.848260402679443, -6.602388858795166, -6.356517314910889, -6.1106462478637695, -5.864774703979492, -5.618903160095215, -5.3730316162109375, -5.12716007232666, -4.881288528442383, -4.6354169845581055, -4.389545440673828, -4.143673896789551, -3.8978025913238525, -3.651930809020996, -3.4060592651367188, -3.1601877212524414, -2.914316177368164, -2.6684446334838867, -2.4225730895996094, -2.176701784133911, -1.9308302402496338, -1.6849586963653564, -1.439087152481079, -1.1932156085968018, -0.947344183921814, -0.7014726400375366, -0.4556010961532593, -0.20972967147827148, 0.03614187240600586, 0.282012939453125, 0.5278844833374023, 0.7737559676170349, 1.0196274518966675, 1.2654989957809448, 1.5113705396652222, 1.75724196434021, 2.0031135082244873, 2.2489850521087646, 2.494856595993042, 2.7407281398773193, 2.9865994453430176, 3.232470989227295, 3.4783425331115723, 3.7242140769958496, 3.970085620880127, 4.215957164764404, 4.461828708648682, 4.707700252532959, 4.953571796417236, 5.199443340301514, 5.445314884185791, 5.69118595123291, 5.9370574951171875, 6.182929039001465, 6.428800582885742, 6.6746721267700195, 6.920543670654297, 7.166415214538574, 7.412286758422852, 7.658158302307129, 7.904029846191406, 8.149901390075684]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 10.0, 21.0, 9.0, 24.0, 32.0, 43.0, 85.0, 136.0, 233.0, 407.0, 736.0, 1454.0, 4116.0, 21644.0, 1121111.0, 3012390.0, 24269.0, 4391.0, 1522.0, 737.0, 330.0, 221.0, 138.0, 83.0, 42.0, 20.0, 20.0, 14.0, 6.0, 7.0, 7.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.50390625, -3.409271240234375, -3.31463623046875, -3.220001220703125, -3.1253662109375, -3.030731201171875, -2.93609619140625, -2.841461181640625, -2.746826171875, -2.652191162109375, -2.55755615234375, -2.462921142578125, -2.3682861328125, -2.273651123046875, -2.17901611328125, -2.084381103515625, -1.98974609375, -1.895111083984375, -1.80047607421875, -1.705841064453125, -1.6112060546875, -1.516571044921875, -1.42193603515625, -1.327301025390625, -1.232666015625, -1.138031005859375, -1.04339599609375, -0.948760986328125, -0.8541259765625, -0.759490966796875, -0.66485595703125, -0.570220947265625, -0.4755859375, -0.380950927734375, -0.28631591796875, -0.191680908203125, -0.0970458984375, -0.002410888671875, 0.09222412109375, 0.186859130859375, 0.281494140625, 0.376129150390625, 0.47076416015625, 0.565399169921875, 0.6600341796875, 0.754669189453125, 0.84930419921875, 0.943939208984375, 1.03857421875, 1.133209228515625, 1.22784423828125, 1.322479248046875, 1.4171142578125, 1.511749267578125, 1.60638427734375, 1.701019287109375, 1.795654296875, 1.890289306640625, 1.98492431640625, 2.079559326171875, 2.1741943359375, 2.268829345703125, 2.36346435546875, 2.458099365234375, 2.552734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 10.0, 19.0, 35.0, 27.0, 77.0, 103.0, 110.0, 119.0, 122.0, 94.0, 89.0, 71.0, 34.0, 23.0, 24.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.63525390625, -0.6164703369140625, -0.597686767578125, -0.5789031982421875, -0.56011962890625, -0.5413360595703125, -0.522552490234375, -0.5037689208984375, -0.4849853515625, -0.4662017822265625, -0.447418212890625, -0.4286346435546875, -0.40985107421875, -0.3910675048828125, -0.372283935546875, -0.3535003662109375, -0.334716796875, -0.3159332275390625, -0.297149658203125, -0.2783660888671875, -0.25958251953125, -0.2407989501953125, -0.222015380859375, -0.2032318115234375, -0.1844482421875, -0.1656646728515625, -0.146881103515625, -0.1280975341796875, -0.10931396484375, -0.0905303955078125, -0.071746826171875, -0.0529632568359375, -0.0341796875, -0.0153961181640625, 0.003387451171875, 0.0221710205078125, 0.04095458984375, 0.0597381591796875, 0.078521728515625, 0.0973052978515625, 0.1160888671875, 0.1348724365234375, 0.153656005859375, 0.1724395751953125, 0.19122314453125, 0.2100067138671875, 0.228790283203125, 0.2475738525390625, 0.266357421875, 0.2851409912109375, 0.303924560546875, 0.3227081298828125, 0.34149169921875, 0.3602752685546875, 0.379058837890625, 0.3978424072265625, 0.4166259765625, 0.4354095458984375, 0.454193115234375, 0.4729766845703125, 0.49176025390625, 0.5105438232421875, 0.529327392578125, 0.5481109619140625, 0.56689453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 13.0, 10.0, 16.0, 28.0, 47.0, 65.0, 104.0, 169.0, 282.0, 528.0, 1124.0, 2770.0, 11407.0, 96060.0, 3834917.0, 222057.0, 18116.0, 3854.0, 1395.0, 625.0, 277.0, 152.0, 70.0, 52.0, 61.0, 22.0, 17.0, 15.0, 11.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.4822845458984375, -2.419647216796875, -2.3570098876953125, -2.29437255859375, -2.2317352294921875, -2.169097900390625, -2.1064605712890625, -2.0438232421875, -1.9811859130859375, -1.918548583984375, -1.8559112548828125, -1.79327392578125, -1.7306365966796875, -1.667999267578125, -1.6053619384765625, -1.542724609375, -1.4800872802734375, -1.417449951171875, -1.3548126220703125, -1.29217529296875, -1.2295379638671875, -1.166900634765625, -1.1042633056640625, -1.0416259765625, -0.9789886474609375, -0.916351318359375, -0.8537139892578125, -0.79107666015625, -0.7284393310546875, -0.665802001953125, -0.6031646728515625, -0.54052734375, -0.4778900146484375, -0.415252685546875, -0.3526153564453125, -0.28997802734375, -0.2273406982421875, -0.164703369140625, -0.1020660400390625, -0.0394287109375, 0.0232086181640625, 0.085845947265625, 0.1484832763671875, 0.21112060546875, 0.2737579345703125, 0.336395263671875, 0.3990325927734375, 0.461669921875, 0.5243072509765625, 0.586944580078125, 0.6495819091796875, 0.71221923828125, 0.7748565673828125, 0.837493896484375, 0.9001312255859375, 0.9627685546875, 1.0254058837890625, 1.088043212890625, 1.1506805419921875, 1.21331787109375, 1.2759552001953125, 1.338592529296875, 1.4012298583984375, 1.4638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 16.0, 29.0, 55.0, 140.0, 373.0, 2223.0, 848.0, 190.0, 74.0, 46.0, 33.0, 11.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0830612182617188, -1.0577239990234375, -1.0323867797851562, -1.007049560546875, -0.9817123413085938, -0.9563751220703125, -0.9310379028320312, -0.90570068359375, -0.8803634643554688, -0.8550262451171875, -0.8296890258789062, -0.804351806640625, -0.7790145874023438, -0.7536773681640625, -0.7283401489257812, -0.7030029296875, -0.6776657104492188, -0.6523284912109375, -0.6269912719726562, -0.601654052734375, -0.5763168334960938, -0.5509796142578125, -0.5256423950195312, -0.50030517578125, -0.47496795654296875, -0.4496307373046875, -0.42429351806640625, -0.398956298828125, -0.37361907958984375, -0.3482818603515625, -0.32294464111328125, -0.297607421875, -0.27227020263671875, -0.2469329833984375, -0.22159576416015625, -0.196258544921875, -0.17092132568359375, -0.1455841064453125, -0.12024688720703125, -0.09490966796875, -0.06957244873046875, -0.0442352294921875, -0.01889801025390625, 0.006439208984375, 0.03177642822265625, 0.0571136474609375, 0.08245086669921875, 0.1077880859375, 0.13312530517578125, 0.1584625244140625, 0.18379974365234375, 0.209136962890625, 0.23447418212890625, 0.2598114013671875, 0.28514862060546875, 0.31048583984375, 0.33582305908203125, 0.3611602783203125, 0.38649749755859375, 0.411834716796875, 0.43717193603515625, 0.4625091552734375, 0.48784637451171875, 0.51318359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 22.0, 44.0, 113.0, 188.0, 246.0, 213.0, 94.0, 39.0, 22.0, 14.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.731424808502197, -5.589971542358398, -5.4485182762146, -5.307065486907959, -5.16561222076416, -5.024158954620361, -4.8827056884765625, -4.741252422332764, -4.599799156188965, -4.458345890045166, -4.316892623901367, -4.175439834594727, -4.033986568450928, -3.892533302307129, -3.75108003616333, -3.6096267700195312, -3.4681739807128906, -3.326720714569092, -3.185267686843872, -3.0438144207000732, -2.9023613929748535, -2.7609081268310547, -2.619454860687256, -2.478001594543457, -2.3365485668182373, -2.1950953006744385, -2.0536422729492188, -1.91218900680542, -1.7707358598709106, -1.6292827129364014, -1.4878294467926025, -1.3463762998580933, -1.2049236297607422, -1.063470482826233, -0.9220172762870789, -0.7805640697479248, -0.6391109228134155, -0.49765777587890625, -0.3562045693397522, -0.21475136280059814, -0.07329821586608887, 0.0681549608707428, 0.20960813760757446, 0.35106131434440613, 0.4925144910812378, 0.6339676380157471, 0.7754208445549011, 0.9168740510940552, 1.0583271980285645, 1.1997803449630737, 1.341233491897583, 1.4826867580413818, 1.6241399049758911, 1.7655930519104004, 1.9070463180541992, 2.048499584197998, 2.1899526119232178, 2.3314058780670166, 2.4728589057922363, 2.614312171936035, 2.755765438079834, 2.8972184658050537, 3.0386717319488525, 3.1801247596740723, 3.321578025817871]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 11.0, 10.0, 12.0, 13.0, 31.0, 29.0, 32.0, 43.0, 36.0, 34.0, 55.0, 45.0, 50.0, 56.0, 54.0, 52.0, 63.0, 45.0, 36.0, 36.0, 46.0, 37.0, 29.0, 22.0, 23.0, 24.0, 10.0, 8.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8159911632537842, -1.7610372304916382, -1.7060832977294922, -1.6511292457580566, -1.5961753129959106, -1.5412213802337646, -1.4862674474716187, -1.4313135147094727, -1.376359462738037, -1.3214055299758911, -1.2664515972137451, -1.2114975452423096, -1.1565436124801636, -1.1015896797180176, -1.0466357469558716, -0.9916818141937256, -0.9367278814315796, -0.8817739486694336, -0.8268199563026428, -0.7718660235404968, -0.716912031173706, -0.6619580984115601, -0.6070041656494141, -0.5520502328872681, -0.4970962405204773, -0.4421422779560089, -0.3871883153915405, -0.33223438262939453, -0.27728042006492615, -0.22232645750045776, -0.16737252473831177, -0.11241856217384338, -0.057464599609375, -0.002510644495487213, 0.052443310618400574, 0.10739725828170776, 0.16235122084617615, 0.21730518341064453, 0.2722591161727905, 0.3272130787372589, 0.3821670413017273, 0.4371210038661957, 0.49207496643066406, 0.5470288991928101, 0.601982831954956, 0.6569368243217468, 0.7118907570838928, 0.7668447494506836, 0.8217986822128296, 0.8767526149749756, 0.9317066073417664, 0.9866605401039124, 1.0416145324707031, 1.0965684652328491, 1.1515223979949951, 1.2064763307571411, 1.261430263519287, 1.316384196281433, 1.371338129043579, 1.4262921810150146, 1.4812461137771606, 1.5362000465393066, 1.5911539793014526, 1.6461079120635986, 1.7010619640350342]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 12.0, 8.0, 20.0, 12.0, 28.0, 26.0, 47.0, 62.0, 100.0, 111.0, 163.0, 237.0, 363.0, 485.0, 723.0, 1046.0, 1715.0, 2884.0, 6307.0, 19033.0, 90177.0, 452068.0, 375415.0, 68958.0, 15558.0, 5386.0, 2770.0, 1582.0, 1012.0, 704.0, 460.0, 323.0, 195.0, 151.0, 104.0, 82.0, 65.0, 54.0, 30.0, 22.0, 13.0, 19.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.61541748046875, -1.5531005859375, -1.49078369140625, -1.428466796875, -1.36614990234375, -1.3038330078125, -1.24151611328125, -1.17919921875, -1.11688232421875, -1.0545654296875, -0.99224853515625, -0.929931640625, -0.86761474609375, -0.8052978515625, -0.74298095703125, -0.6806640625, -0.61834716796875, -0.5560302734375, -0.49371337890625, -0.431396484375, -0.36907958984375, -0.3067626953125, -0.24444580078125, -0.18212890625, -0.11981201171875, -0.0574951171875, 0.00482177734375, 0.067138671875, 0.12945556640625, 0.1917724609375, 0.25408935546875, 0.31640625, 0.37872314453125, 0.4410400390625, 0.50335693359375, 0.565673828125, 0.62799072265625, 0.6903076171875, 0.75262451171875, 0.81494140625, 0.87725830078125, 0.9395751953125, 1.00189208984375, 1.064208984375, 1.12652587890625, 1.1888427734375, 1.25115966796875, 1.3134765625, 1.37579345703125, 1.4381103515625, 1.50042724609375, 1.562744140625, 1.62506103515625, 1.6873779296875, 1.74969482421875, 1.81201171875, 1.87432861328125, 1.9366455078125, 1.99896240234375, 2.061279296875, 2.12359619140625, 2.1859130859375, 2.24822998046875, 2.310546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 30.0, 28.0, 62.0, 70.0, 111.0, 112.0, 134.0, 110.0, 109.0, 78.0, 52.0, 33.0, 20.0, 10.0, 4.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65185546875, -0.63232421875, -0.61279296875, -0.59326171875, -0.57373046875, -0.55419921875, -0.53466796875, -0.51513671875, -0.49560546875, -0.47607421875, -0.45654296875, -0.43701171875, -0.41748046875, -0.39794921875, -0.37841796875, -0.35888671875, -0.33935546875, -0.31982421875, -0.30029296875, -0.28076171875, -0.26123046875, -0.24169921875, -0.22216796875, -0.20263671875, -0.18310546875, -0.16357421875, -0.14404296875, -0.12451171875, -0.10498046875, -0.08544921875, -0.06591796875, -0.04638671875, -0.02685546875, -0.00732421875, 0.01220703125, 0.03173828125, 0.05126953125, 0.07080078125, 0.09033203125, 0.10986328125, 0.12939453125, 0.14892578125, 0.16845703125, 0.18798828125, 0.20751953125, 0.22705078125, 0.24658203125, 0.26611328125, 0.28564453125, 0.30517578125, 0.32470703125, 0.34423828125, 0.36376953125, 0.38330078125, 0.40283203125, 0.42236328125, 0.44189453125, 0.46142578125, 0.48095703125, 0.50048828125, 0.52001953125, 0.53955078125, 0.55908203125, 0.57861328125, 0.59814453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 14.0, 20.0, 21.0, 42.0, 45.0, 59.0, 120.0, 173.0, 272.0, 565.0, 1141.0, 2746.0, 7596.0, 23118.0, 82573.0, 295424.0, 427337.0, 147784.0, 39729.0, 12031.0, 4135.0, 1711.0, 797.0, 403.0, 269.0, 155.0, 87.0, 61.0, 42.0, 23.0, 19.0, 10.0, 9.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.10711669921875, -1.0716552734375, -1.03619384765625, -1.000732421875, -0.96527099609375, -0.9298095703125, -0.89434814453125, -0.85888671875, -0.82342529296875, -0.7879638671875, -0.75250244140625, -0.717041015625, -0.68157958984375, -0.6461181640625, -0.61065673828125, -0.5751953125, -0.53973388671875, -0.5042724609375, -0.46881103515625, -0.433349609375, -0.39788818359375, -0.3624267578125, -0.32696533203125, -0.29150390625, -0.25604248046875, -0.2205810546875, -0.18511962890625, -0.149658203125, -0.11419677734375, -0.0787353515625, -0.04327392578125, -0.0078125, 0.02764892578125, 0.0631103515625, 0.09857177734375, 0.134033203125, 0.16949462890625, 0.2049560546875, 0.24041748046875, 0.27587890625, 0.31134033203125, 0.3468017578125, 0.38226318359375, 0.417724609375, 0.45318603515625, 0.4886474609375, 0.52410888671875, 0.5595703125, 0.59503173828125, 0.6304931640625, 0.66595458984375, 0.701416015625, 0.73687744140625, 0.7723388671875, 0.80780029296875, 0.84326171875, 0.87872314453125, 0.9141845703125, 0.94964599609375, 0.985107421875, 1.02056884765625, 1.0560302734375, 1.09149169921875, 1.126953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 8.0, 5.0, 7.0, 14.0, 10.0, 11.0, 22.0, 23.0, 38.0, 20.0, 35.0, 35.0, 56.0, 52.0, 62.0, 52.0, 50.0, 50.0, 56.0, 54.0, 52.0, 52.0, 44.0, 31.0, 31.0, 39.0, 21.0, 23.0, 16.0, 10.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.2007293701171875, -1.160247802734375, -1.1197662353515625, -1.07928466796875, -1.0388031005859375, -0.998321533203125, -0.9578399658203125, -0.9173583984375, -0.8768768310546875, -0.836395263671875, -0.7959136962890625, -0.75543212890625, -0.7149505615234375, -0.674468994140625, -0.6339874267578125, -0.593505859375, -0.5530242919921875, -0.512542724609375, -0.4720611572265625, -0.43157958984375, -0.3910980224609375, -0.350616455078125, -0.3101348876953125, -0.2696533203125, -0.2291717529296875, -0.188690185546875, -0.1482086181640625, -0.10772705078125, -0.0672454833984375, -0.026763916015625, 0.0137176513671875, 0.05419921875, 0.0946807861328125, 0.135162353515625, 0.1756439208984375, 0.21612548828125, 0.2566070556640625, 0.297088623046875, 0.3375701904296875, 0.3780517578125, 0.4185333251953125, 0.459014892578125, 0.4994964599609375, 0.53997802734375, 0.5804595947265625, 0.620941162109375, 0.6614227294921875, 0.701904296875, 0.7423858642578125, 0.782867431640625, 0.8233489990234375, 0.86383056640625, 0.9043121337890625, 0.944793701171875, 0.9852752685546875, 1.0257568359375, 1.0662384033203125, 1.106719970703125, 1.1472015380859375, 1.18768310546875, 1.2281646728515625, 1.268646240234375, 1.3091278076171875, 1.349609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 16.0, 27.0, 39.0, 63.0, 103.0, 161.0, 282.0, 617.0, 1377.0, 4309.0, 20513.0, 162677.0, 629782.0, 196792.0, 24055.0, 4790.0, 1583.0, 634.0, 299.0, 172.0, 100.0, 46.0, 32.0, 21.0, 14.0, 10.0, 8.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.669921875, -0.6505279541015625, -0.631134033203125, -0.6117401123046875, -0.59234619140625, -0.5729522705078125, -0.553558349609375, -0.5341644287109375, -0.5147705078125, -0.4953765869140625, -0.475982666015625, -0.4565887451171875, -0.43719482421875, -0.4178009033203125, -0.398406982421875, -0.3790130615234375, -0.359619140625, -0.3402252197265625, -0.320831298828125, -0.3014373779296875, -0.28204345703125, -0.2626495361328125, -0.243255615234375, -0.2238616943359375, -0.2044677734375, -0.1850738525390625, -0.165679931640625, -0.1462860107421875, -0.12689208984375, -0.1074981689453125, -0.088104248046875, -0.0687103271484375, -0.04931640625, -0.0299224853515625, -0.010528564453125, 0.0088653564453125, 0.02825927734375, 0.0476531982421875, 0.067047119140625, 0.0864410400390625, 0.1058349609375, 0.1252288818359375, 0.144622802734375, 0.1640167236328125, 0.18341064453125, 0.2028045654296875, 0.222198486328125, 0.2415924072265625, 0.260986328125, 0.2803802490234375, 0.299774169921875, 0.3191680908203125, 0.33856201171875, 0.3579559326171875, 0.377349853515625, 0.3967437744140625, 0.4161376953125, 0.4355316162109375, 0.454925537109375, 0.4743194580078125, 0.49371337890625, 0.5131072998046875, 0.532501220703125, 0.5518951416015625, 0.5712890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 9.0, 5.0, 7.0, 16.0, 20.0, 20.0, 28.0, 40.0, 39.0, 32.0, 66.0, 67.0, 90.0, 86.0, 91.0, 78.0, 63.0, 55.0, 45.0, 26.0, 20.0, 34.0, 12.0, 17.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.00010198354721069336, -9.93385910987854e-05, -9.669363498687744e-05, -9.404867887496948e-05, -9.140372276306152e-05, -8.875876665115356e-05, -8.61138105392456e-05, -8.346885442733765e-05, -8.082389831542969e-05, -7.817894220352173e-05, -7.553398609161377e-05, -7.288902997970581e-05, -7.024407386779785e-05, -6.759911775588989e-05, -6.495416164398193e-05, -6.230920553207397e-05, -5.9664249420166016e-05, -5.701929330825806e-05, -5.43743371963501e-05, -5.172938108444214e-05, -4.908442497253418e-05, -4.643946886062622e-05, -4.379451274871826e-05, -4.11495566368103e-05, -3.8504600524902344e-05, -3.5859644412994385e-05, -3.3214688301086426e-05, -3.056973218917847e-05, -2.7924776077270508e-05, -2.527981996536255e-05, -2.263486385345459e-05, -1.998990774154663e-05, -1.7344951629638672e-05, -1.4699995517730713e-05, -1.2055039405822754e-05, -9.410083293914795e-06, -6.765127182006836e-06, -4.120171070098877e-06, -1.475214958190918e-06, 1.169741153717041e-06, 3.814697265625e-06, 6.459653377532959e-06, 9.104609489440918e-06, 1.1749565601348877e-05, 1.4394521713256836e-05, 1.7039477825164795e-05, 1.9684433937072754e-05, 2.2329390048980713e-05, 2.4974346160888672e-05, 2.761930227279663e-05, 3.026425838470459e-05, 3.290921449661255e-05, 3.555417060852051e-05, 3.819912672042847e-05, 4.0844082832336426e-05, 4.3489038944244385e-05, 4.6133995056152344e-05, 4.87789511680603e-05, 5.142390727996826e-05, 5.406886339187622e-05, 5.671381950378418e-05, 5.935877561569214e-05, 6.20037317276001e-05, 6.464868783950806e-05, 6.729364395141602e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 3.0, 5.0, 5.0, 12.0, 23.0, 34.0, 47.0, 92.0, 142.0, 247.0, 478.0, 925.0, 2345.0, 6628.0, 25313.0, 126810.0, 484769.0, 317235.0, 62270.0, 13981.0, 4137.0, 1531.0, 682.0, 365.0, 197.0, 103.0, 62.0, 45.0, 24.0, 11.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.40769195556640625, -0.3930206298828125, -0.37834930419921875, -0.363677978515625, -0.34900665283203125, -0.3343353271484375, -0.31966400146484375, -0.30499267578125, -0.29032135009765625, -0.2756500244140625, -0.26097869873046875, -0.246307373046875, -0.23163604736328125, -0.2169647216796875, -0.20229339599609375, -0.1876220703125, -0.17295074462890625, -0.1582794189453125, -0.14360809326171875, -0.128936767578125, -0.11426544189453125, -0.0995941162109375, -0.08492279052734375, -0.07025146484375, -0.05558013916015625, -0.0409088134765625, -0.02623748779296875, -0.011566162109375, 0.00310516357421875, 0.0177764892578125, 0.03244781494140625, 0.047119140625, 0.06179046630859375, 0.0764617919921875, 0.09113311767578125, 0.105804443359375, 0.12047576904296875, 0.1351470947265625, 0.14981842041015625, 0.16448974609375, 0.17916107177734375, 0.1938323974609375, 0.20850372314453125, 0.223175048828125, 0.23784637451171875, 0.2525177001953125, 0.26718902587890625, 0.2818603515625, 0.29653167724609375, 0.3112030029296875, 0.32587432861328125, 0.340545654296875, 0.35521697998046875, 0.3698883056640625, 0.38455963134765625, 0.39923095703125, 0.41390228271484375, 0.4285736083984375, 0.44324493408203125, 0.457916259765625, 0.47258758544921875, 0.4872589111328125, 0.5019302368164062, 0.5166015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 7.0, 7.0, 10.0, 11.0, 24.0, 39.0, 27.0, 48.0, 81.0, 93.0, 94.0, 116.0, 88.0, 84.0, 69.0, 47.0, 44.0, 30.0, 22.0, 17.0, 16.0, 10.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3066825866699219, -0.29183197021484375, -0.2769813537597656, -0.2621307373046875, -0.24728012084960938, -0.23242950439453125, -0.21757888793945312, -0.202728271484375, -0.18787765502929688, -0.17302703857421875, -0.15817642211914062, -0.1433258056640625, -0.12847518920898438, -0.11362457275390625, -0.09877395629882812, -0.08392333984375, -0.06907272338867188, -0.05422210693359375, -0.039371490478515625, -0.0245208740234375, -0.009670257568359375, 0.00518035888671875, 0.020030975341796875, 0.034881591796875, 0.049732208251953125, 0.06458282470703125, 0.07943344116210938, 0.0942840576171875, 0.10913467407226562, 0.12398529052734375, 0.13883590698242188, 0.1536865234375, 0.16853713989257812, 0.18338775634765625, 0.19823837280273438, 0.2130889892578125, 0.22793960571289062, 0.24279022216796875, 0.2576408386230469, 0.272491455078125, 0.2873420715332031, 0.30219268798828125, 0.3170433044433594, 0.3318939208984375, 0.3467445373535156, 0.36159515380859375, 0.3764457702636719, 0.39129638671875, 0.4061470031738281, 0.42099761962890625, 0.4358482360839844, 0.4506988525390625, 0.4655494689941406, 0.48040008544921875, 0.4952507019042969, 0.510101318359375, 0.5249519348144531, 0.5398025512695312, 0.5546531677246094, 0.5695037841796875, 0.5843544006347656, 0.5992050170898438, 0.6140556335449219, 0.62890625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 2.0, 7.0, 10.0, 18.0, 21.0, 44.0, 57.0, 94.0, 142.0, 130.0, 140.0, 107.0, 79.0, 52.0, 29.0, 19.0, 17.0, 5.0, 3.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.574131965637207, -8.32158088684082, -8.069028854370117, -7.816477298736572, -7.563925743103027, -7.311374187469482, -7.0588226318359375, -6.806271076202393, -6.553719520568848, -6.301167964935303, -6.048616409301758, -5.796064853668213, -5.543513298034668, -5.290961742401123, -5.038410186767578, -4.785858631134033, -4.533307075500488, -4.280755519866943, -4.028203964233398, -3.7756524085998535, -3.5231008529663086, -3.2705492973327637, -3.0179977416992188, -2.765446186065674, -2.512894630432129, -2.260343074798584, -2.007791519165039, -1.7552399635314941, -1.5026884078979492, -1.2501368522644043, -0.9975852966308594, -0.7450337409973145, -0.49248218536376953, -0.2399306297302246, 0.012620925903320312, 0.26517248153686523, 0.5177240371704102, 0.7702755928039551, 1.0228271484375, 1.275378704071045, 1.5279302597045898, 1.7804818153381348, 2.0330333709716797, 2.2855849266052246, 2.5381364822387695, 2.7906880378723145, 3.0432395935058594, 3.2957911491394043, 3.548342704772949, 3.800894260406494, 4.053445816040039, 4.305997371673584, 4.558548927307129, 4.811100482940674, 5.063652038574219, 5.316203594207764, 5.568755149841309, 5.8213067054748535, 6.073858261108398, 6.326409816741943, 6.578961372375488, 6.831512928009033, 7.084064483642578, 7.336616039276123, 7.589167594909668]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 2.0, 8.0, 10.0, 17.0, 11.0, 16.0, 19.0, 25.0, 27.0, 25.0, 32.0, 30.0, 24.0, 34.0, 32.0, 38.0, 54.0, 42.0, 33.0, 50.0, 42.0, 32.0, 48.0, 38.0, 52.0, 36.0, 30.0, 29.0, 18.0, 18.0, 14.0, 16.0, 16.0, 11.0, 13.0, 15.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.057811737060547, -4.880091667175293, -4.702371120452881, -4.524651050567627, -4.346930980682373, -4.169210433959961, -3.991490364074707, -3.813770055770874, -3.636049747467041, -3.458329439163208, -3.280609369277954, -3.102889060974121, -2.925168752670288, -2.747448444366455, -2.569728374481201, -2.392008066177368, -2.2142879962921143, -2.0365676879882812, -1.8588474988937378, -1.6811273097991943, -1.5034070014953613, -1.3256868124008179, -1.1479666233062744, -0.9702463150024414, -0.792526125907898, -0.6148058772087097, -0.43708565831184387, -0.259365439414978, -0.0816451907157898, 0.09607505798339844, 0.2737952470779419, 0.4515155553817749, 0.6292357444763184, 0.8069559931755066, 0.9846762418746948, 1.1623964309692383, 1.3401167392730713, 1.5178369283676147, 1.6955571174621582, 1.8732774257659912, 2.050997734069824, 2.2287180423736572, 2.406438112258911, 2.584158420562744, 2.761878728866577, 2.93959903717041, 3.117319107055664, 3.295039415359497, 3.472759485244751, 3.650479793548584, 3.828199863433838, 4.00592041015625, 4.183640480041504, 4.361360549926758, 4.539080619812012, 4.716801166534424, 4.894521236419678, 5.072241306304932, 5.249961853027344, 5.427681922912598, 5.605401992797852, 5.783122539520264, 5.960842609405518, 6.13856315612793, 6.316283226013184]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 1.0, 6.0, 9.0, 10.0, 8.0, 19.0, 23.0, 33.0, 54.0, 78.0, 112.0, 211.0, 379.0, 635.0, 1261.0, 3009.0, 11725.0, 112893.0, 3965518.0, 83878.0, 9656.0, 2550.0, 1022.0, 486.0, 304.0, 138.0, 101.0, 52.0, 43.0, 17.0, 16.0, 15.0, 3.0, 4.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.1015625, -3.0059814453125, -2.910400390625, -2.8148193359375, -2.71923828125, -2.6236572265625, -2.528076171875, -2.4324951171875, -2.3369140625, -2.2413330078125, -2.145751953125, -2.0501708984375, -1.95458984375, -1.8590087890625, -1.763427734375, -1.6678466796875, -1.572265625, -1.4766845703125, -1.381103515625, -1.2855224609375, -1.18994140625, -1.0943603515625, -0.998779296875, -0.9031982421875, -0.8076171875, -0.7120361328125, -0.616455078125, -0.5208740234375, -0.42529296875, -0.3297119140625, -0.234130859375, -0.1385498046875, -0.04296875, 0.0526123046875, 0.148193359375, 0.2437744140625, 0.33935546875, 0.4349365234375, 0.530517578125, 0.6260986328125, 0.7216796875, 0.8172607421875, 0.912841796875, 1.0084228515625, 1.10400390625, 1.1995849609375, 1.295166015625, 1.3907470703125, 1.486328125, 1.5819091796875, 1.677490234375, 1.7730712890625, 1.86865234375, 1.9642333984375, 2.059814453125, 2.1553955078125, 2.2509765625, 2.3465576171875, 2.442138671875, 2.5377197265625, 2.63330078125, 2.7288818359375, 2.824462890625, 2.9200439453125, 3.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 11.0, 25.0, 28.0, 45.0, 72.0, 102.0, 112.0, 108.0, 120.0, 96.0, 84.0, 68.0, 40.0, 23.0, 18.0, 12.0, 9.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6279296875, -0.6087417602539062, -0.5895538330078125, -0.5703659057617188, -0.551177978515625, -0.5319900512695312, -0.5128021240234375, -0.49361419677734375, -0.47442626953125, -0.45523834228515625, -0.4360504150390625, -0.41686248779296875, -0.397674560546875, -0.37848663330078125, -0.3592987060546875, -0.34011077880859375, -0.3209228515625, -0.30173492431640625, -0.2825469970703125, -0.26335906982421875, -0.244171142578125, -0.22498321533203125, -0.2057952880859375, -0.18660736083984375, -0.16741943359375, -0.14823150634765625, -0.1290435791015625, -0.10985565185546875, -0.090667724609375, -0.07147979736328125, -0.0522918701171875, -0.03310394287109375, -0.013916015625, 0.00527191162109375, 0.0244598388671875, 0.04364776611328125, 0.062835693359375, 0.08202362060546875, 0.1012115478515625, 0.12039947509765625, 0.13958740234375, 0.15877532958984375, 0.1779632568359375, 0.19715118408203125, 0.216339111328125, 0.23552703857421875, 0.2547149658203125, 0.27390289306640625, 0.2930908203125, 0.31227874755859375, 0.3314666748046875, 0.35065460205078125, 0.369842529296875, 0.38903045654296875, 0.4082183837890625, 0.42740631103515625, 0.44659423828125, 0.46578216552734375, 0.4849700927734375, 0.5041580200195312, 0.523345947265625, 0.5425338745117188, 0.5617218017578125, 0.5809097290039062, 0.60009765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 9.0, 10.0, 9.0, 16.0, 14.0, 22.0, 48.0, 43.0, 70.0, 103.0, 165.0, 274.0, 468.0, 1213.0, 3821.0, 21926.0, 632759.0, 3479291.0, 45092.0, 5833.0, 1652.0, 561.0, 305.0, 152.0, 110.0, 79.0, 53.0, 47.0, 25.0, 30.0, 27.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.041961669921875, -1.96673583984375, -1.891510009765625, -1.8162841796875, -1.741058349609375, -1.66583251953125, -1.590606689453125, -1.515380859375, -1.440155029296875, -1.36492919921875, -1.289703369140625, -1.2144775390625, -1.139251708984375, -1.06402587890625, -0.988800048828125, -0.91357421875, -0.838348388671875, -0.76312255859375, -0.687896728515625, -0.6126708984375, -0.537445068359375, -0.46221923828125, -0.386993408203125, -0.311767578125, -0.236541748046875, -0.16131591796875, -0.086090087890625, -0.0108642578125, 0.064361572265625, 0.13958740234375, 0.214813232421875, 0.2900390625, 0.365264892578125, 0.44049072265625, 0.515716552734375, 0.5909423828125, 0.666168212890625, 0.74139404296875, 0.816619873046875, 0.891845703125, 0.967071533203125, 1.04229736328125, 1.117523193359375, 1.1927490234375, 1.267974853515625, 1.34320068359375, 1.418426513671875, 1.49365234375, 1.568878173828125, 1.64410400390625, 1.719329833984375, 1.7945556640625, 1.869781494140625, 1.94500732421875, 2.020233154296875, 2.095458984375, 2.170684814453125, 2.24591064453125, 2.321136474609375, 2.3963623046875, 2.471588134765625, 2.54681396484375, 2.622039794921875, 2.697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 16.0, 37.0, 101.0, 441.0, 2614.0, 636.0, 134.0, 50.0, 20.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.115234375, -1.065948486328125, -1.01666259765625, -0.967376708984375, -0.9180908203125, -0.868804931640625, -0.81951904296875, -0.770233154296875, -0.720947265625, -0.671661376953125, -0.62237548828125, -0.573089599609375, -0.5238037109375, -0.474517822265625, -0.42523193359375, -0.375946044921875, -0.32666015625, -0.277374267578125, -0.22808837890625, -0.178802490234375, -0.1295166015625, -0.080230712890625, -0.03094482421875, 0.018341064453125, 0.067626953125, 0.116912841796875, 0.16619873046875, 0.215484619140625, 0.2647705078125, 0.314056396484375, 0.36334228515625, 0.412628173828125, 0.4619140625, 0.511199951171875, 0.56048583984375, 0.609771728515625, 0.6590576171875, 0.708343505859375, 0.75762939453125, 0.806915283203125, 0.856201171875, 0.905487060546875, 0.95477294921875, 1.004058837890625, 1.0533447265625, 1.102630615234375, 1.15191650390625, 1.201202392578125, 1.25048828125, 1.299774169921875, 1.34906005859375, 1.398345947265625, 1.4476318359375, 1.496917724609375, 1.54620361328125, 1.595489501953125, 1.644775390625, 1.694061279296875, 1.74334716796875, 1.792633056640625, 1.8419189453125, 1.891204833984375, 1.94049072265625, 1.989776611328125, 2.0390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 8.0, 33.0, 67.0, 154.0, 230.0, 236.0, 139.0, 68.0, 37.0, 14.0, 3.0, 6.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.674568176269531, -7.492204666137695, -7.309841156005859, -7.127477645874023, -6.9451141357421875, -6.762750148773193, -6.580386638641357, -6.3980231285095215, -6.2156596183776855, -6.03329610824585, -5.850932598114014, -5.668569087982178, -5.486205101013184, -5.303841590881348, -5.121478080749512, -4.939114570617676, -4.75675106048584, -4.574387550354004, -4.392024040222168, -4.209660530090332, -4.027297019958496, -3.844933271408081, -3.662569522857666, -3.48020601272583, -3.297842502593994, -3.115478992462158, -2.9331154823303223, -2.7507517337799072, -2.5683882236480713, -2.3860247135162354, -2.2036609649658203, -2.0212974548339844, -1.8389344215393066, -1.6565709114074707, -1.4742072820663452, -1.2918436527252197, -1.1094801425933838, -0.9271165728569031, -0.7447530031204224, -0.5623893737792969, -0.38002586364746094, -0.19766229391098022, -0.015298724174499512, 0.1670648455619812, 0.3494284152984619, 0.5317919850349426, 0.7141555547714233, 0.8965191841125488, 1.0788826942443848, 1.2612462043762207, 1.4436098337173462, 1.6259734630584717, 1.8083369731903076, 1.9907004833221436, 2.1730642318725586, 2.3554277420043945, 2.5377912521362305, 2.7201547622680664, 2.9025182723999023, 3.0848820209503174, 3.2672455310821533, 3.4496090412139893, 3.6319727897644043, 3.8143362998962402, 3.996699810028076]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 13.0, 11.0, 21.0, 28.0, 41.0, 42.0, 61.0, 51.0, 71.0, 81.0, 84.0, 84.0, 75.0, 57.0, 54.0, 58.0, 40.0, 33.0, 17.0, 24.0, 10.0, 11.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150228977203369, -3.053276538848877, -2.956324338912964, -2.859372138977051, -2.7624197006225586, -2.6654672622680664, -2.5685150623321533, -2.4715628623962402, -2.374610424041748, -2.277657985687256, -2.1807057857513428, -2.0837535858154297, -1.9868011474609375, -1.8898488283157349, -1.7928965091705322, -1.6959441900253296, -1.598991870880127, -1.5020395517349243, -1.4050872325897217, -1.308134913444519, -1.2111825942993164, -1.1142302751541138, -1.0172779560089111, -0.9203256368637085, -0.8233733177185059, -0.7264209985733032, -0.6294686794281006, -0.532516360282898, -0.4355640411376953, -0.3386117219924927, -0.24165940284729004, -0.1447070837020874, -0.047754764556884766, 0.04919755458831787, 0.1461498737335205, 0.24310219287872314, 0.3400545120239258, 0.4370068311691284, 0.533959150314331, 0.6309114694595337, 0.7278637886047363, 0.824816107749939, 0.9217684268951416, 1.0187207460403442, 1.1156730651855469, 1.2126253843307495, 1.3095777034759521, 1.4065300226211548, 1.5034823417663574, 1.60043466091156, 1.6973869800567627, 1.7943392992019653, 1.891291618347168, 1.9882439374923706, 2.0851962566375732, 2.1821484565734863, 2.2791008949279785, 2.3760533332824707, 2.473005533218384, 2.569957733154297, 2.666910171508789, 2.7638626098632812, 2.8608148097991943, 2.9577670097351074, 3.0547194480895996]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 12.0, 10.0, 11.0, 21.0, 29.0, 39.0, 55.0, 88.0, 155.0, 268.0, 411.0, 830.0, 1600.0, 3588.0, 10924.0, 81771.0, 742213.0, 179336.0, 18080.0, 4742.0, 2061.0, 997.0, 509.0, 271.0, 185.0, 112.0, 81.0, 42.0, 31.0, 20.0, 11.0, 4.0, 9.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.52325439453125, -2.4351806640625, -2.34710693359375, -2.259033203125, -2.17095947265625, -2.0828857421875, -1.99481201171875, -1.90673828125, -1.81866455078125, -1.7305908203125, -1.64251708984375, -1.554443359375, -1.46636962890625, -1.3782958984375, -1.29022216796875, -1.2021484375, -1.11407470703125, -1.0260009765625, -0.93792724609375, -0.849853515625, -0.76177978515625, -0.6737060546875, -0.58563232421875, -0.49755859375, -0.40948486328125, -0.3214111328125, -0.23333740234375, -0.145263671875, -0.05718994140625, 0.0308837890625, 0.11895751953125, 0.20703125, 0.29510498046875, 0.3831787109375, 0.47125244140625, 0.559326171875, 0.64739990234375, 0.7354736328125, 0.82354736328125, 0.91162109375, 0.99969482421875, 1.0877685546875, 1.17584228515625, 1.263916015625, 1.35198974609375, 1.4400634765625, 1.52813720703125, 1.6162109375, 1.70428466796875, 1.7923583984375, 1.88043212890625, 1.968505859375, 2.05657958984375, 2.1446533203125, 2.23272705078125, 2.32080078125, 2.40887451171875, 2.4969482421875, 2.58502197265625, 2.673095703125, 2.76116943359375, 2.8492431640625, 2.93731689453125, 3.025390625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 7.0, 11.0, 12.0, 25.0, 36.0, 53.0, 76.0, 104.0, 116.0, 114.0, 113.0, 108.0, 69.0, 59.0, 32.0, 23.0, 16.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66552734375, -0.6450347900390625, -0.624542236328125, -0.6040496826171875, -0.58355712890625, -0.5630645751953125, -0.542572021484375, -0.5220794677734375, -0.5015869140625, -0.4810943603515625, -0.460601806640625, -0.4401092529296875, -0.41961669921875, -0.3991241455078125, -0.378631591796875, -0.3581390380859375, -0.337646484375, -0.3171539306640625, -0.296661376953125, -0.2761688232421875, -0.25567626953125, -0.2351837158203125, -0.214691162109375, -0.1941986083984375, -0.1737060546875, -0.1532135009765625, -0.132720947265625, -0.1122283935546875, -0.09173583984375, -0.0712432861328125, -0.050750732421875, -0.0302581787109375, -0.009765625, 0.0107269287109375, 0.031219482421875, 0.0517120361328125, 0.07220458984375, 0.0926971435546875, 0.113189697265625, 0.1336822509765625, 0.1541748046875, 0.1746673583984375, 0.195159912109375, 0.2156524658203125, 0.23614501953125, 0.2566375732421875, 0.277130126953125, 0.2976226806640625, 0.318115234375, 0.3386077880859375, 0.359100341796875, 0.3795928955078125, 0.40008544921875, 0.4205780029296875, 0.441070556640625, 0.4615631103515625, 0.4820556640625, 0.5025482177734375, 0.523040771484375, 0.5435333251953125, 0.56402587890625, 0.5845184326171875, 0.605010986328125, 0.6255035400390625, 0.64599609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 14.0, 15.0, 24.0, 28.0, 41.0, 68.0, 93.0, 143.0, 212.0, 336.0, 679.0, 1482.0, 3619.0, 10272.0, 37078.0, 153646.0, 496753.0, 258198.0, 60478.0, 16191.0, 5098.0, 1969.0, 873.0, 420.0, 243.0, 175.0, 92.0, 68.0, 49.0, 41.0, 33.0, 21.0, 18.0, 10.0, 8.0, 7.0, 4.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.220703125, -1.1855010986328125, -1.150299072265625, -1.1150970458984375, -1.07989501953125, -1.0446929931640625, -1.009490966796875, -0.9742889404296875, -0.9390869140625, -0.9038848876953125, -0.868682861328125, -0.8334808349609375, -0.79827880859375, -0.7630767822265625, -0.727874755859375, -0.6926727294921875, -0.657470703125, -0.6222686767578125, -0.587066650390625, -0.5518646240234375, -0.51666259765625, -0.4814605712890625, -0.446258544921875, -0.4110565185546875, -0.3758544921875, -0.3406524658203125, -0.305450439453125, -0.2702484130859375, -0.23504638671875, -0.1998443603515625, -0.164642333984375, -0.1294403076171875, -0.09423828125, -0.0590362548828125, -0.023834228515625, 0.0113677978515625, 0.04656982421875, 0.0817718505859375, 0.116973876953125, 0.1521759033203125, 0.1873779296875, 0.2225799560546875, 0.257781982421875, 0.2929840087890625, 0.32818603515625, 0.3633880615234375, 0.398590087890625, 0.4337921142578125, 0.468994140625, 0.5041961669921875, 0.539398193359375, 0.5746002197265625, 0.60980224609375, 0.6450042724609375, 0.680206298828125, 0.7154083251953125, 0.7506103515625, 0.7858123779296875, 0.821014404296875, 0.8562164306640625, 0.89141845703125, 0.9266204833984375, 0.961822509765625, 0.9970245361328125, 1.0322265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 7.0, 1.0, 9.0, 11.0, 10.0, 19.0, 19.0, 18.0, 29.0, 17.0, 18.0, 36.0, 29.0, 30.0, 37.0, 38.0, 40.0, 52.0, 45.0, 51.0, 36.0, 42.0, 42.0, 46.0, 33.0, 29.0, 32.0, 29.0, 33.0, 19.0, 22.0, 20.0, 17.0, 17.0, 15.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0], "bins": [-1.1005859375, -1.0685272216796875, -1.036468505859375, -1.0044097900390625, -0.97235107421875, -0.9402923583984375, -0.908233642578125, -0.8761749267578125, -0.8441162109375, -0.8120574951171875, -0.779998779296875, -0.7479400634765625, -0.71588134765625, -0.6838226318359375, -0.651763916015625, -0.6197052001953125, -0.587646484375, -0.5555877685546875, -0.523529052734375, -0.4914703369140625, -0.45941162109375, -0.4273529052734375, -0.395294189453125, -0.3632354736328125, -0.3311767578125, -0.2991180419921875, -0.267059326171875, -0.2350006103515625, -0.20294189453125, -0.1708831787109375, -0.138824462890625, -0.1067657470703125, -0.07470703125, -0.0426483154296875, -0.010589599609375, 0.0214691162109375, 0.05352783203125, 0.0855865478515625, 0.117645263671875, 0.1497039794921875, 0.1817626953125, 0.2138214111328125, 0.245880126953125, 0.2779388427734375, 0.30999755859375, 0.3420562744140625, 0.374114990234375, 0.4061737060546875, 0.438232421875, 0.4702911376953125, 0.502349853515625, 0.5344085693359375, 0.56646728515625, 0.5985260009765625, 0.630584716796875, 0.6626434326171875, 0.6947021484375, 0.7267608642578125, 0.758819580078125, 0.7908782958984375, 0.82293701171875, 0.8549957275390625, 0.887054443359375, 0.9191131591796875, 0.951171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 8.0, 11.0, 28.0, 23.0, 43.0, 109.0, 227.0, 655.0, 2589.0, 26418.0, 838266.0, 171438.0, 6882.0, 1141.0, 406.0, 125.0, 80.0, 47.0, 20.0, 19.0, 8.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.197265625, -1.1595458984375, -1.121826171875, -1.0841064453125, -1.04638671875, -1.0086669921875, -0.970947265625, -0.9332275390625, -0.8955078125, -0.8577880859375, -0.820068359375, -0.7823486328125, -0.74462890625, -0.7069091796875, -0.669189453125, -0.6314697265625, -0.59375, -0.5560302734375, -0.518310546875, -0.4805908203125, -0.44287109375, -0.4051513671875, -0.367431640625, -0.3297119140625, -0.2919921875, -0.2542724609375, -0.216552734375, -0.1788330078125, -0.14111328125, -0.1033935546875, -0.065673828125, -0.0279541015625, 0.009765625, 0.0474853515625, 0.085205078125, 0.1229248046875, 0.16064453125, 0.1983642578125, 0.236083984375, 0.2738037109375, 0.3115234375, 0.3492431640625, 0.386962890625, 0.4246826171875, 0.46240234375, 0.5001220703125, 0.537841796875, 0.5755615234375, 0.61328125, 0.6510009765625, 0.688720703125, 0.7264404296875, 0.76416015625, 0.8018798828125, 0.839599609375, 0.8773193359375, 0.9150390625, 0.9527587890625, 0.990478515625, 1.0281982421875, 1.06591796875, 1.1036376953125, 1.141357421875, 1.1790771484375, 1.216796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 5.0, 6.0, 12.0, 11.0, 15.0, 18.0, 22.0, 39.0, 46.0, 67.0, 59.0, 83.0, 91.0, 102.0, 78.0, 66.0, 54.0, 43.0, 31.0, 26.0, 25.0, 14.0, 15.0, 8.0, 20.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.779764175415039e-05, -8.535757660865784e-05, -8.291751146316528e-05, -8.047744631767273e-05, -7.803738117218018e-05, -7.559731602668762e-05, -7.315725088119507e-05, -7.071718573570251e-05, -6.827712059020996e-05, -6.583705544471741e-05, -6.339699029922485e-05, -6.09569251537323e-05, -5.8516860008239746e-05, -5.607679486274719e-05, -5.363672971725464e-05, -5.1196664571762085e-05, -4.875659942626953e-05, -4.631653428077698e-05, -4.3876469135284424e-05, -4.143640398979187e-05, -3.8996338844299316e-05, -3.655627369880676e-05, -3.411620855331421e-05, -3.1676143407821655e-05, -2.92360782623291e-05, -2.6796013116836548e-05, -2.4355947971343994e-05, -2.191588282585144e-05, -1.9475817680358887e-05, -1.7035752534866333e-05, -1.459568738937378e-05, -1.2155622243881226e-05, -9.715557098388672e-06, -7.275491952896118e-06, -4.8354268074035645e-06, -2.3953616619110107e-06, 4.470348358154297e-08, 2.4847686290740967e-06, 4.92483377456665e-06, 7.364898920059204e-06, 9.804964065551758e-06, 1.2245029211044312e-05, 1.4685094356536865e-05, 1.712515950202942e-05, 1.9565224647521973e-05, 2.2005289793014526e-05, 2.444535493850708e-05, 2.6885420083999634e-05, 2.9325485229492188e-05, 3.176555037498474e-05, 3.4205615520477295e-05, 3.664568066596985e-05, 3.90857458114624e-05, 4.1525810956954956e-05, 4.396587610244751e-05, 4.6405941247940063e-05, 4.884600639343262e-05, 5.128607153892517e-05, 5.3726136684417725e-05, 5.616620182991028e-05, 5.860626697540283e-05, 6.104633212089539e-05, 6.348639726638794e-05, 6.592646241188049e-05, 6.836652755737305e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 15.0, 20.0, 34.0, 64.0, 82.0, 149.0, 443.0, 2122.0, 37973.0, 971714.0, 33079.0, 2016.0, 456.0, 159.0, 89.0, 53.0, 30.0, 16.0, 12.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.01171875, -1.9607696533203125, -1.909820556640625, -1.8588714599609375, -1.80792236328125, -1.7569732666015625, -1.706024169921875, -1.6550750732421875, -1.6041259765625, -1.5531768798828125, -1.502227783203125, -1.4512786865234375, -1.40032958984375, -1.3493804931640625, -1.298431396484375, -1.2474822998046875, -1.196533203125, -1.1455841064453125, -1.094635009765625, -1.0436859130859375, -0.99273681640625, -0.9417877197265625, -0.890838623046875, -0.8398895263671875, -0.7889404296875, -0.7379913330078125, -0.687042236328125, -0.6360931396484375, -0.58514404296875, -0.5341949462890625, -0.483245849609375, -0.4322967529296875, -0.38134765625, -0.3303985595703125, -0.279449462890625, -0.2285003662109375, -0.17755126953125, -0.1266021728515625, -0.075653076171875, -0.0247039794921875, 0.0262451171875, 0.0771942138671875, 0.128143310546875, 0.1790924072265625, 0.23004150390625, 0.2809906005859375, 0.331939697265625, 0.3828887939453125, 0.433837890625, 0.4847869873046875, 0.535736083984375, 0.5866851806640625, 0.63763427734375, 0.6885833740234375, 0.739532470703125, 0.7904815673828125, 0.8414306640625, 0.8923797607421875, 0.943328857421875, 0.9942779541015625, 1.04522705078125, 1.0961761474609375, 1.147125244140625, 1.1980743408203125, 1.2490234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 5.0, 10.0, 15.0, 16.0, 21.0, 23.0, 34.0, 41.0, 49.0, 51.0, 95.0, 97.0, 99.0, 75.0, 82.0, 57.0, 53.0, 40.0, 28.0, 24.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.426513671875, -0.4127540588378906, -0.39899444580078125, -0.3852348327636719, -0.3714752197265625, -0.3577156066894531, -0.34395599365234375, -0.3301963806152344, -0.316436767578125, -0.3026771545410156, -0.28891754150390625, -0.2751579284667969, -0.2613983154296875, -0.24763870239257812, -0.23387908935546875, -0.22011947631835938, -0.20635986328125, -0.19260025024414062, -0.17884063720703125, -0.16508102416992188, -0.1513214111328125, -0.13756179809570312, -0.12380218505859375, -0.11004257202148438, -0.096282958984375, -0.08252334594726562, -0.06876373291015625, -0.055004119873046875, -0.0412445068359375, -0.027484893798828125, -0.01372528076171875, 3.4332275390625e-05, 0.0137939453125, 0.027553558349609375, 0.04131317138671875, 0.055072784423828125, 0.0688323974609375, 0.08259201049804688, 0.09635162353515625, 0.11011123657226562, 0.123870849609375, 0.13763046264648438, 0.15139007568359375, 0.16514968872070312, 0.1789093017578125, 0.19266891479492188, 0.20642852783203125, 0.22018814086914062, 0.23394775390625, 0.24770736694335938, 0.26146697998046875, 0.2752265930175781, 0.2889862060546875, 0.3027458190917969, 0.31650543212890625, 0.3302650451660156, 0.344024658203125, 0.3577842712402344, 0.37154388427734375, 0.3853034973144531, 0.3990631103515625, 0.4128227233886719, 0.42658233642578125, 0.4403419494628906, 0.4541015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 22.0, 34.0, 157.0, 353.0, 299.0, 110.0, 22.0, 11.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.736228942871094, -27.10340690612793, -26.470584869384766, -25.83776092529297, -25.204938888549805, -24.57211685180664, -23.939294815063477, -23.306472778320312, -22.67365074157715, -22.040828704833984, -21.40800666809082, -20.775184631347656, -20.14236068725586, -19.509538650512695, -18.87671661376953, -18.243894577026367, -17.611072540283203, -16.97825050354004, -16.345428466796875, -15.712605476379395, -15.07978343963623, -14.44696044921875, -13.814138412475586, -13.181316375732422, -12.548492431640625, -11.915670394897461, -11.28284740447998, -10.650025367736816, -10.017203330993652, -9.384380340576172, -8.751558303833008, -8.118736267089844, -7.48591423034668, -6.853091716766357, -6.220269680023193, -5.587447166442871, -4.954625129699707, -4.321802616119385, -3.6889801025390625, -3.0561580657958984, -2.423335552215576, -1.790513277053833, -1.1576908826828003, -0.5248684883117676, 0.10795378684997559, 0.7407760620117188, 1.373598575592041, 2.006420612335205, 2.6392431259155273, 3.2720654010772705, 3.9048876762390137, 4.537710189819336, 5.1705322265625, 5.803354740142822, 6.4361772537231445, 7.068999290466309, 7.701821804046631, 8.334644317626953, 8.967466354370117, 9.600288391113281, 10.233111381530762, 10.865933418273926, 11.498756408691406, 12.13157844543457, 12.764400482177734]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 7.0, 9.0, 13.0, 10.0, 15.0, 15.0, 21.0, 20.0, 25.0, 23.0, 32.0, 40.0, 21.0, 39.0, 48.0, 56.0, 46.0, 55.0, 38.0, 45.0, 38.0, 47.0, 45.0, 37.0, 47.0, 26.0, 25.0, 23.0, 19.0, 23.0, 10.0, 11.0, 12.0, 8.0, 13.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.246608734130859, -5.0803542137146, -4.914100170135498, -4.747845649719238, -4.581591606140137, -4.415337085723877, -4.249083042144775, -4.082828521728516, -3.916574478149414, -3.7503201961517334, -3.5840659141540527, -3.417811632156372, -3.2515573501586914, -3.0853030681610107, -2.91904878616333, -2.7527942657470703, -2.5865399837493896, -2.420285701751709, -2.2540314197540283, -2.0877771377563477, -1.921522855758667, -1.7552685737609863, -1.5890141725540161, -1.4227598905563354, -1.2565056085586548, -1.0902513265609741, -0.9239970445632935, -0.757742702960968, -0.5914884209632874, -0.4252341389656067, -0.25897979736328125, -0.09272551536560059, 0.07352876663208008, 0.23978306353092194, 0.4060373604297638, 0.5722916722297668, 0.7385459542274475, 0.9048002362251282, 1.0710545778274536, 1.2373088598251343, 1.403563141822815, 1.5698174238204956, 1.7360717058181763, 1.9023261070251465, 2.068580389022827, 2.234834671020508, 2.4010889530181885, 2.567343235015869, 2.73359751701355, 2.8998517990112305, 3.066106081008911, 3.232360363006592, 3.3986146450042725, 3.564868927001953, 3.731123447418213, 3.8973774909973145, 4.063632011413574, 4.229886531829834, 4.3961405754089355, 4.562395095825195, 4.728649139404297, 4.894903659820557, 5.061157703399658, 5.227412223815918, 5.3936662673950195]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 20.0, 24.0, 32.0, 36.0, 54.0, 83.0, 118.0, 172.0, 266.0, 470.0, 803.0, 1684.0, 4405.0, 17388.0, 228431.0, 3874682.0, 51682.0, 8546.0, 2766.0, 1159.0, 554.0, 311.0, 162.0, 137.0, 78.0, 58.0, 37.0, 29.0, 13.0, 10.0, 17.0, 5.0, 10.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.876953125, -2.79974365234375, -2.7225341796875, -2.64532470703125, -2.568115234375, -2.49090576171875, -2.4136962890625, -2.33648681640625, -2.25927734375, -2.18206787109375, -2.1048583984375, -2.02764892578125, -1.950439453125, -1.87322998046875, -1.7960205078125, -1.71881103515625, -1.6416015625, -1.56439208984375, -1.4871826171875, -1.40997314453125, -1.332763671875, -1.25555419921875, -1.1783447265625, -1.10113525390625, -1.02392578125, -0.94671630859375, -0.8695068359375, -0.79229736328125, -0.715087890625, -0.63787841796875, -0.5606689453125, -0.48345947265625, -0.40625, -0.32904052734375, -0.2518310546875, -0.17462158203125, -0.097412109375, -0.02020263671875, 0.0570068359375, 0.13421630859375, 0.21142578125, 0.28863525390625, 0.3658447265625, 0.44305419921875, 0.520263671875, 0.59747314453125, 0.6746826171875, 0.75189208984375, 0.8291015625, 0.90631103515625, 0.9835205078125, 1.06072998046875, 1.137939453125, 1.21514892578125, 1.2923583984375, 1.36956787109375, 1.44677734375, 1.52398681640625, 1.6011962890625, 1.67840576171875, 1.755615234375, 1.83282470703125, 1.9100341796875, 1.98724365234375, 2.064453125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 20.0, 37.0, 52.0, 82.0, 100.0, 98.0, 144.0, 94.0, 94.0, 91.0, 55.0, 38.0, 27.0, 17.0, 6.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65966796875, -0.6387786865234375, -0.617889404296875, -0.5970001220703125, -0.57611083984375, -0.5552215576171875, -0.534332275390625, -0.5134429931640625, -0.4925537109375, -0.4716644287109375, -0.450775146484375, -0.4298858642578125, -0.40899658203125, -0.3881072998046875, -0.367218017578125, -0.3463287353515625, -0.325439453125, -0.3045501708984375, -0.283660888671875, -0.2627716064453125, -0.24188232421875, -0.2209930419921875, -0.200103759765625, -0.1792144775390625, -0.1583251953125, -0.1374359130859375, -0.116546630859375, -0.0956573486328125, -0.07476806640625, -0.0538787841796875, -0.032989501953125, -0.0121002197265625, 0.0087890625, 0.0296783447265625, 0.050567626953125, 0.0714569091796875, 0.09234619140625, 0.1132354736328125, 0.134124755859375, 0.1550140380859375, 0.1759033203125, 0.1967926025390625, 0.217681884765625, 0.2385711669921875, 0.25946044921875, 0.2803497314453125, 0.301239013671875, 0.3221282958984375, 0.343017578125, 0.3639068603515625, 0.384796142578125, 0.4056854248046875, 0.42657470703125, 0.4474639892578125, 0.468353271484375, 0.4892425537109375, 0.5101318359375, 0.5310211181640625, 0.551910400390625, 0.5727996826171875, 0.59368896484375, 0.6145782470703125, 0.635467529296875, 0.6563568115234375, 0.67724609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 9.0, 8.0, 17.0, 11.0, 27.0, 33.0, 62.0, 90.0, 108.0, 146.0, 257.0, 566.0, 1191.0, 2939.0, 9417.0, 46859.0, 3058069.0, 1022895.0, 38110.0, 8431.0, 2663.0, 1062.0, 533.0, 290.0, 156.0, 97.0, 71.0, 44.0, 32.0, 23.0, 15.0, 3.0, 9.0, 10.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.34375, -2.2835693359375, -2.223388671875, -2.1632080078125, -2.10302734375, -2.0428466796875, -1.982666015625, -1.9224853515625, -1.8623046875, -1.8021240234375, -1.741943359375, -1.6817626953125, -1.62158203125, -1.5614013671875, -1.501220703125, -1.4410400390625, -1.380859375, -1.3206787109375, -1.260498046875, -1.2003173828125, -1.14013671875, -1.0799560546875, -1.019775390625, -0.9595947265625, -0.8994140625, -0.8392333984375, -0.779052734375, -0.7188720703125, -0.65869140625, -0.5985107421875, -0.538330078125, -0.4781494140625, -0.41796875, -0.3577880859375, -0.297607421875, -0.2374267578125, -0.17724609375, -0.1170654296875, -0.056884765625, 0.0032958984375, 0.0634765625, 0.1236572265625, 0.183837890625, 0.2440185546875, 0.30419921875, 0.3643798828125, 0.424560546875, 0.4847412109375, 0.544921875, 0.6051025390625, 0.665283203125, 0.7254638671875, 0.78564453125, 0.8458251953125, 0.906005859375, 0.9661865234375, 1.0263671875, 1.0865478515625, 1.146728515625, 1.2069091796875, 1.26708984375, 1.3272705078125, 1.387451171875, 1.4476318359375, 1.5078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 13.0, 7.0, 29.0, 51.0, 106.0, 353.0, 2512.0, 699.0, 141.0, 69.0, 32.0, 21.0, 16.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2874984741210938, -1.2566375732421875, -1.2257766723632812, -1.194915771484375, -1.1640548706054688, -1.1331939697265625, -1.1023330688476562, -1.07147216796875, -1.0406112670898438, -1.0097503662109375, -0.9788894653320312, -0.948028564453125, -0.9171676635742188, -0.8863067626953125, -0.8554458618164062, -0.8245849609375, -0.7937240600585938, -0.7628631591796875, -0.7320022583007812, -0.701141357421875, -0.6702804565429688, -0.6394195556640625, -0.6085586547851562, -0.57769775390625, -0.5468368530273438, -0.5159759521484375, -0.48511505126953125, -0.454254150390625, -0.42339324951171875, -0.3925323486328125, -0.36167144775390625, -0.330810546875, -0.29994964599609375, -0.2690887451171875, -0.23822784423828125, -0.207366943359375, -0.17650604248046875, -0.1456451416015625, -0.11478424072265625, -0.08392333984375, -0.05306243896484375, -0.0222015380859375, 0.00865936279296875, 0.039520263671875, 0.07038116455078125, 0.1012420654296875, 0.13210296630859375, 0.1629638671875, 0.19382476806640625, 0.2246856689453125, 0.25554656982421875, 0.286407470703125, 0.31726837158203125, 0.3481292724609375, 0.37899017333984375, 0.40985107421875, 0.44071197509765625, 0.4715728759765625, 0.5024337768554688, 0.533294677734375, 0.5641555786132812, 0.5950164794921875, 0.6258773803710938, 0.65673828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 3.0, 10.0, 21.0, 30.0, 70.0, 102.0, 160.0, 212.0, 165.0, 108.0, 55.0, 29.0, 15.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6022846698760986, -3.4805939197540283, -3.358903169631958, -3.2372124195098877, -3.1155216693878174, -2.993830919265747, -2.872140407562256, -2.7504496574401855, -2.6287589073181152, -2.507068157196045, -2.3853774070739746, -2.2636866569519043, -2.141995906829834, -2.0203051567077637, -1.898614525794983, -1.7769237756729126, -1.6552329063415527, -1.5335421562194824, -1.411851406097412, -1.2901606559753418, -1.1684699058532715, -1.0467791557312012, -0.9250885248184204, -0.8033977746963501, -0.6817070245742798, -0.5600162744522095, -0.43832555413246155, -0.3166348338127136, -0.1949440836906433, -0.073253333568573, 0.04843735694885254, 0.17012810707092285, 0.29181909561157227, 0.4135098457336426, 0.5352005958557129, 0.6568912863731384, 0.7785820364952087, 0.900272786617279, 1.0219634771347046, 1.143654227256775, 1.2653449773788452, 1.3870357275009155, 1.5087264776229858, 1.6304171085357666, 1.752107858657837, 1.8737986087799072, 1.9954893589019775, 2.117180109024048, 2.238870859146118, 2.3605616092681885, 2.482252359390259, 2.603943109512329, 2.7256338596343994, 2.8473246097564697, 2.969015121459961, 3.0907058715820312, 3.2123966217041016, 3.334087371826172, 3.455778121948242, 3.5774688720703125, 3.699159622192383, 3.820850372314453, 3.9425411224365234, 4.064231872558594, 4.185922622680664]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 13.0, 18.0, 14.0, 27.0, 42.0, 27.0, 52.0, 55.0, 53.0, 54.0, 68.0, 69.0, 73.0, 58.0, 76.0, 50.0, 49.0, 40.0, 37.0, 33.0, 15.0, 18.0, 13.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4217028617858887, -2.3500778675079346, -2.2784526348114014, -2.2068276405334473, -2.135202646255493, -2.063577651977539, -1.9919524192810059, -1.9203274250030518, -1.848702311515808, -1.7770771980285645, -1.7054522037506104, -1.6338270902633667, -1.562201976776123, -1.490576982498169, -1.4189518690109253, -1.3473267555236816, -1.2757017612457275, -1.2040766477584839, -1.1324516534805298, -1.0608265399932861, -0.9892014861106873, -0.9175764322280884, -0.8459513187408447, -0.7743262648582458, -0.702701210975647, -0.6310761570930481, -0.5594511032104492, -0.48782598972320557, -0.4162009358406067, -0.3445758819580078, -0.27295079827308655, -0.20132571458816528, -0.1297008991241455, -0.05807583034038544, 0.013549238443374634, 0.0851743072271347, 0.15679937601089478, 0.22842442989349365, 0.3000495135784149, 0.3716745972633362, 0.44329965114593506, 0.5149247050285339, 0.5865497589111328, 0.6581748723983765, 0.7297999262809753, 0.8014249801635742, 0.8730500936508179, 0.9446751475334167, 1.0163002014160156, 1.0879253149032593, 1.1595503091812134, 1.231175422668457, 1.3028004169464111, 1.3744255304336548, 1.4460506439208984, 1.5176756381988525, 1.5893007516860962, 1.6609258651733398, 1.732550859451294, 1.8041759729385376, 1.8758010864257812, 1.9474260807037354, 2.0190510749816895, 2.0906763076782227, 2.1623013019561768]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 15.0, 27.0, 64.0, 109.0, 203.0, 468.0, 961.0, 2392.0, 9452.0, 153239.0, 830390.0, 43063.0, 5102.0, 1638.0, 729.0, 337.0, 157.0, 102.0, 29.0, 31.0, 10.0, 8.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.390625, -4.26971435546875, -4.1488037109375, -4.02789306640625, -3.906982421875, -3.78607177734375, -3.6651611328125, -3.54425048828125, -3.42333984375, -3.30242919921875, -3.1815185546875, -3.06060791015625, -2.939697265625, -2.81878662109375, -2.6978759765625, -2.57696533203125, -2.4560546875, -2.33514404296875, -2.2142333984375, -2.09332275390625, -1.972412109375, -1.85150146484375, -1.7305908203125, -1.60968017578125, -1.48876953125, -1.36785888671875, -1.2469482421875, -1.12603759765625, -1.005126953125, -0.88421630859375, -0.7633056640625, -0.64239501953125, -0.521484375, -0.40057373046875, -0.2796630859375, -0.15875244140625, -0.037841796875, 0.08306884765625, 0.2039794921875, 0.32489013671875, 0.44580078125, 0.56671142578125, 0.6876220703125, 0.80853271484375, 0.929443359375, 1.05035400390625, 1.1712646484375, 1.29217529296875, 1.4130859375, 1.53399658203125, 1.6549072265625, 1.77581787109375, 1.896728515625, 2.01763916015625, 2.1385498046875, 2.25946044921875, 2.38037109375, 2.50128173828125, 2.6221923828125, 2.74310302734375, 2.864013671875, 2.98492431640625, 3.1058349609375, 3.22674560546875, 3.34765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 16.0, 21.0, 31.0, 70.0, 84.0, 109.0, 113.0, 135.0, 118.0, 86.0, 65.0, 52.0, 45.0, 16.0, 7.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7021484375, -0.6797256469726562, -0.6573028564453125, -0.6348800659179688, -0.612457275390625, -0.5900344848632812, -0.5676116943359375, -0.5451889038085938, -0.52276611328125, -0.5003433227539062, -0.4779205322265625, -0.45549774169921875, -0.433074951171875, -0.41065216064453125, -0.3882293701171875, -0.36580657958984375, -0.3433837890625, -0.32096099853515625, -0.2985382080078125, -0.27611541748046875, -0.253692626953125, -0.23126983642578125, -0.2088470458984375, -0.18642425537109375, -0.16400146484375, -0.14157867431640625, -0.1191558837890625, -0.09673309326171875, -0.074310302734375, -0.05188751220703125, -0.0294647216796875, -0.00704193115234375, 0.015380859375, 0.03780364990234375, 0.0602264404296875, 0.08264923095703125, 0.105072021484375, 0.12749481201171875, 0.1499176025390625, 0.17234039306640625, 0.19476318359375, 0.21718597412109375, 0.2396087646484375, 0.26203155517578125, 0.284454345703125, 0.30687713623046875, 0.3292999267578125, 0.35172271728515625, 0.3741455078125, 0.39656829833984375, 0.4189910888671875, 0.44141387939453125, 0.463836669921875, 0.48625946044921875, 0.5086822509765625, 0.5311050415039062, 0.55352783203125, 0.5759506225585938, 0.5983734130859375, 0.6207962036132812, 0.643218994140625, 0.6656417846679688, 0.6880645751953125, 0.7104873657226562, 0.73291015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 3.0, 7.0, 3.0, 11.0, 17.0, 19.0, 21.0, 16.0, 33.0, 36.0, 65.0, 90.0, 92.0, 141.0, 225.0, 404.0, 670.0, 1503.0, 3169.0, 7527.0, 21030.0, 60498.0, 174017.0, 392050.0, 248701.0, 88130.0, 30667.0, 11111.0, 4252.0, 1885.0, 812.0, 493.0, 254.0, 153.0, 114.0, 70.0, 60.0, 55.0, 31.0, 24.0, 24.0, 21.0, 16.0, 8.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.912109375, -0.8865432739257812, -0.8609771728515625, -0.8354110717773438, -0.809844970703125, -0.7842788696289062, -0.7587127685546875, -0.7331466674804688, -0.70758056640625, -0.6820144653320312, -0.6564483642578125, -0.6308822631835938, -0.605316162109375, -0.5797500610351562, -0.5541839599609375, -0.5286178588867188, -0.5030517578125, -0.47748565673828125, -0.4519195556640625, -0.42635345458984375, -0.400787353515625, -0.37522125244140625, -0.3496551513671875, -0.32408905029296875, -0.29852294921875, -0.27295684814453125, -0.2473907470703125, -0.22182464599609375, -0.196258544921875, -0.17069244384765625, -0.1451263427734375, -0.11956024169921875, -0.093994140625, -0.06842803955078125, -0.0428619384765625, -0.01729583740234375, 0.008270263671875, 0.03383636474609375, 0.0594024658203125, 0.08496856689453125, 0.11053466796875, 0.13610076904296875, 0.1616668701171875, 0.18723297119140625, 0.212799072265625, 0.23836517333984375, 0.2639312744140625, 0.28949737548828125, 0.3150634765625, 0.34062957763671875, 0.3661956787109375, 0.39176177978515625, 0.417327880859375, 0.44289398193359375, 0.4684600830078125, 0.49402618408203125, 0.51959228515625, 0.5451583862304688, 0.5707244873046875, 0.5962905883789062, 0.621856689453125, 0.6474227905273438, 0.6729888916015625, 0.6985549926757812, 0.72412109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 3.0, 4.0, 10.0, 13.0, 8.0, 12.0, 16.0, 14.0, 19.0, 18.0, 18.0, 36.0, 38.0, 35.0, 43.0, 30.0, 38.0, 36.0, 41.0, 50.0, 41.0, 35.0, 45.0, 43.0, 45.0, 34.0, 37.0, 21.0, 30.0, 26.0, 32.0, 21.0, 16.0, 19.0, 10.0, 18.0, 7.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.9775390625, -0.9475173950195312, -0.9174957275390625, -0.8874740600585938, -0.857452392578125, -0.8274307250976562, -0.7974090576171875, -0.7673873901367188, -0.73736572265625, -0.7073440551757812, -0.6773223876953125, -0.6473007202148438, -0.617279052734375, -0.5872573852539062, -0.5572357177734375, -0.5272140502929688, -0.4971923828125, -0.46717071533203125, -0.4371490478515625, -0.40712738037109375, -0.377105712890625, -0.34708404541015625, -0.3170623779296875, -0.28704071044921875, -0.25701904296875, -0.22699737548828125, -0.1969757080078125, -0.16695404052734375, -0.136932373046875, -0.10691070556640625, -0.0768890380859375, -0.04686737060546875, -0.016845703125, 0.01317596435546875, 0.0431976318359375, 0.07321929931640625, 0.103240966796875, 0.13326263427734375, 0.1632843017578125, 0.19330596923828125, 0.22332763671875, 0.25334930419921875, 0.2833709716796875, 0.31339263916015625, 0.343414306640625, 0.37343597412109375, 0.4034576416015625, 0.43347930908203125, 0.4635009765625, 0.49352264404296875, 0.5235443115234375, 0.5535659790039062, 0.583587646484375, 0.6136093139648438, 0.6436309814453125, 0.6736526489257812, 0.70367431640625, 0.7336959838867188, 0.7637176513671875, 0.7937393188476562, 0.823760986328125, 0.8537826538085938, 0.8838043212890625, 0.9138259887695312, 0.94384765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 17.0, 19.0, 31.0, 33.0, 64.0, 84.0, 126.0, 181.0, 267.0, 475.0, 839.0, 1862.0, 5082.0, 18995.0, 104653.0, 486940.0, 347572.0, 61980.0, 12310.0, 3619.0, 1535.0, 683.0, 415.0, 259.0, 142.0, 101.0, 64.0, 51.0, 38.0, 18.0, 23.0, 13.0, 10.0, 4.0, 6.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390869140625, -0.3773231506347656, -0.36377716064453125, -0.3502311706542969, -0.3366851806640625, -0.3231391906738281, -0.30959320068359375, -0.2960472106933594, -0.282501220703125, -0.2689552307128906, -0.25540924072265625, -0.24186325073242188, -0.2283172607421875, -0.21477127075195312, -0.20122528076171875, -0.18767929077148438, -0.17413330078125, -0.16058731079101562, -0.14704132080078125, -0.13349533081054688, -0.1199493408203125, -0.10640335083007812, -0.09285736083984375, -0.07931137084960938, -0.065765380859375, -0.052219390869140625, -0.03867340087890625, -0.025127410888671875, -0.0115814208984375, 0.001964569091796875, 0.01551055908203125, 0.029056549072265625, 0.0426025390625, 0.056148529052734375, 0.06969451904296875, 0.08324050903320312, 0.0967864990234375, 0.11033248901367188, 0.12387847900390625, 0.13742446899414062, 0.150970458984375, 0.16451644897460938, 0.17806243896484375, 0.19160842895507812, 0.2051544189453125, 0.21870040893554688, 0.23224639892578125, 0.24579238891601562, 0.25933837890625, 0.2728843688964844, 0.28643035888671875, 0.2999763488769531, 0.3135223388671875, 0.3270683288574219, 0.34061431884765625, 0.3541603088378906, 0.367706298828125, 0.3812522888183594, 0.39479827880859375, 0.4083442687988281, 0.4218902587890625, 0.4354362487792969, 0.44898223876953125, 0.4625282287597656, 0.47607421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 12.0, 15.0, 23.0, 19.0, 22.0, 53.0, 42.0, 56.0, 77.0, 97.0, 83.0, 93.0, 80.0, 69.0, 60.0, 49.0, 35.0, 26.0, 15.0, 16.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.367134094238281e-05, -7.12154433131218e-05, -6.875954568386078e-05, -6.630364805459976e-05, -6.384775042533875e-05, -6.139185279607773e-05, -5.893595516681671e-05, -5.6480057537555695e-05, -5.402415990829468e-05, -5.156826227903366e-05, -4.9112364649772644e-05, -4.665646702051163e-05, -4.420056939125061e-05, -4.1744671761989594e-05, -3.928877413272858e-05, -3.683287650346756e-05, -3.437697887420654e-05, -3.1921081244945526e-05, -2.946518361568451e-05, -2.7009285986423492e-05, -2.4553388357162476e-05, -2.209749072790146e-05, -1.9641593098640442e-05, -1.7185695469379425e-05, -1.4729797840118408e-05, -1.2273900210857391e-05, -9.818002581596375e-06, -7.362104952335358e-06, -4.906207323074341e-06, -2.450309693813324e-06, 5.587935447692871e-09, 2.4614855647087097e-06, 4.9173831939697266e-06, 7.373280823230743e-06, 9.82917845249176e-06, 1.2285076081752777e-05, 1.4740973711013794e-05, 1.719687134027481e-05, 1.9652768969535828e-05, 2.2108666598796844e-05, 2.456456422805786e-05, 2.7020461857318878e-05, 2.9476359486579895e-05, 3.193225711584091e-05, 3.438815474510193e-05, 3.6844052374362946e-05, 3.929995000362396e-05, 4.175584763288498e-05, 4.4211745262145996e-05, 4.666764289140701e-05, 4.912354052066803e-05, 5.157943814992905e-05, 5.4035335779190063e-05, 5.649123340845108e-05, 5.89471310377121e-05, 6.140302866697311e-05, 6.385892629623413e-05, 6.631482392549515e-05, 6.877072155475616e-05, 7.122661918401718e-05, 7.36825168132782e-05, 7.613841444253922e-05, 7.859431207180023e-05, 8.105020970106125e-05, 8.350610733032227e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 13.0, 17.0, 26.0, 51.0, 74.0, 108.0, 206.0, 422.0, 885.0, 2104.0, 6383.0, 31648.0, 257637.0, 625006.0, 102358.0, 14954.0, 3862.0, 1447.0, 640.0, 296.0, 156.0, 96.0, 57.0, 30.0, 23.0, 10.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4482421875, -0.43181610107421875, -0.4153900146484375, -0.39896392822265625, -0.382537841796875, -0.36611175537109375, -0.3496856689453125, -0.33325958251953125, -0.31683349609375, -0.30040740966796875, -0.2839813232421875, -0.26755523681640625, -0.251129150390625, -0.23470306396484375, -0.2182769775390625, -0.20185089111328125, -0.1854248046875, -0.16899871826171875, -0.1525726318359375, -0.13614654541015625, -0.119720458984375, -0.10329437255859375, -0.0868682861328125, -0.07044219970703125, -0.05401611328125, -0.03759002685546875, -0.0211639404296875, -0.00473785400390625, 0.011688232421875, 0.02811431884765625, 0.0445404052734375, 0.06096649169921875, 0.077392578125, 0.09381866455078125, 0.1102447509765625, 0.12667083740234375, 0.143096923828125, 0.15952301025390625, 0.1759490966796875, 0.19237518310546875, 0.20880126953125, 0.22522735595703125, 0.2416534423828125, 0.25807952880859375, 0.274505615234375, 0.29093170166015625, 0.3073577880859375, 0.32378387451171875, 0.3402099609375, 0.35663604736328125, 0.3730621337890625, 0.38948822021484375, 0.405914306640625, 0.42234039306640625, 0.4387664794921875, 0.45519256591796875, 0.47161865234375, 0.48804473876953125, 0.5044708251953125, 0.5208969116210938, 0.537322998046875, 0.5537490844726562, 0.5701751708984375, 0.5866012573242188, 0.60302734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 17.0, 14.0, 22.0, 27.0, 29.0, 41.0, 45.0, 56.0, 81.0, 84.0, 75.0, 87.0, 80.0, 80.0, 52.0, 48.0, 34.0, 23.0, 23.0, 15.0, 17.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37548828125, -0.36331939697265625, -0.3511505126953125, -0.33898162841796875, -0.326812744140625, -0.31464385986328125, -0.3024749755859375, -0.29030609130859375, -0.27813720703125, -0.26596832275390625, -0.2537994384765625, -0.24163055419921875, -0.229461669921875, -0.21729278564453125, -0.2051239013671875, -0.19295501708984375, -0.1807861328125, -0.16861724853515625, -0.1564483642578125, -0.14427947998046875, -0.132110595703125, -0.11994171142578125, -0.1077728271484375, -0.09560394287109375, -0.08343505859375, -0.07126617431640625, -0.0590972900390625, -0.04692840576171875, -0.034759521484375, -0.02259063720703125, -0.0104217529296875, 0.00174713134765625, 0.013916015625, 0.02608489990234375, 0.0382537841796875, 0.05042266845703125, 0.062591552734375, 0.07476043701171875, 0.0869293212890625, 0.09909820556640625, 0.11126708984375, 0.12343597412109375, 0.1356048583984375, 0.14777374267578125, 0.159942626953125, 0.17211151123046875, 0.1842803955078125, 0.19644927978515625, 0.2086181640625, 0.22078704833984375, 0.2329559326171875, 0.24512481689453125, 0.257293701171875, 0.26946258544921875, 0.2816314697265625, 0.29380035400390625, 0.30596923828125, 0.31813812255859375, 0.3303070068359375, 0.34247589111328125, 0.354644775390625, 0.36681365966796875, 0.3789825439453125, 0.39115142822265625, 0.4033203125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 14.0, 13.0, 15.0, 31.0, 33.0, 51.0, 51.0, 92.0, 105.0, 117.0, 94.0, 97.0, 81.0, 67.0, 46.0, 35.0, 28.0, 11.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.698837280273438, -8.522096633911133, -8.345356941223145, -8.16861629486084, -7.991876602172852, -7.815136432647705, -7.638396263122559, -7.461655616760254, -7.284915924072266, -7.108175754547119, -6.931435585021973, -6.754695415496826, -6.57795524597168, -6.401215076446533, -6.224474906921387, -6.047734260559082, -5.8709940910339355, -5.694253921508789, -5.517513751983643, -5.340773582458496, -5.16403341293335, -4.987293243408203, -4.810552597045898, -4.63381290435791, -4.4570722579956055, -4.280332088470459, -4.1035919189453125, -3.926851749420166, -3.7501115798950195, -3.573371410369873, -3.3966310024261475, -3.219890832901001, -3.0431504249572754, -2.866410255432129, -2.6896700859069824, -2.512929916381836, -2.3361897468566895, -2.159449577331543, -1.9827091693878174, -1.805968999862671, -1.6292288303375244, -1.452488660812378, -1.2757484912872314, -1.0990082025527954, -0.9222680330276489, -0.7455278635025024, -0.5687875747680664, -0.3920474052429199, -0.21530723571777344, -0.038567036390304565, 0.1381731629371643, 0.31491339206695557, 0.49165356159210205, 0.6683937311172485, 0.8451340198516846, 1.021874189376831, 1.1986143589019775, 1.375354528427124, 1.5520946979522705, 1.7288349866867065, 1.905575156211853, 2.082315444946289, 2.2590556144714355, 2.435795783996582, 2.6125359535217285]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 16.0, 12.0, 13.0, 24.0, 26.0, 16.0, 23.0, 38.0, 24.0, 30.0, 42.0, 32.0, 48.0, 41.0, 45.0, 56.0, 49.0, 44.0, 34.0, 44.0, 37.0, 42.0, 36.0, 30.0, 21.0, 21.0, 25.0, 18.0, 15.0, 10.0, 15.0, 15.0, 13.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.717818260192871, -5.5656938552856445, -5.413569450378418, -5.261444568634033, -5.109320163726807, -4.95719575881958, -4.805070877075195, -4.652946472167969, -4.500822067260742, -4.348697662353516, -4.196573257446289, -4.044448375701904, -3.8923239707946777, -3.740199565887451, -3.5880749225616455, -3.43595027923584, -3.2838258743286133, -3.1317014694213867, -2.979576826095581, -2.8274521827697754, -2.675327777862549, -2.5232033729553223, -2.3710787296295166, -2.218954086303711, -2.0668296813964844, -1.9147051572799683, -1.7625806331634521, -1.610456109046936, -1.45833158493042, -1.3062070608139038, -1.1540825366973877, -1.0019580125808716, -0.8498339653015137, -0.6977094411849976, -0.5455849170684814, -0.39346039295196533, -0.24133586883544922, -0.0892113447189331, 0.06291317939758301, 0.21503770351409912, 0.36716222763061523, 0.5192867517471313, 0.6714112758636475, 0.8235357999801636, 0.9756603240966797, 1.1277848482131958, 1.279909372329712, 1.432033896446228, 1.5841584205627441, 1.7362829446792603, 1.8884074687957764, 2.040532112121582, 2.1926565170288086, 2.344780921936035, 2.496905565261841, 2.6490302085876465, 2.801154613494873, 2.9532790184020996, 3.1054036617279053, 3.257528305053711, 3.4096527099609375, 3.561777114868164, 3.7139017581939697, 3.8660264015197754, 4.018150806427002]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 22.0, 19.0, 27.0, 42.0, 71.0, 122.0, 173.0, 309.0, 662.0, 1754.0, 6957.0, 82158.0, 4066714.0, 28721.0, 4225.0, 1191.0, 485.0, 238.0, 130.0, 85.0, 52.0, 29.0, 17.0, 14.0, 8.0, 12.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46875, -5.3046875, -5.140625, -4.9765625, -4.8125, -4.6484375, -4.484375, -4.3203125, -4.15625, -3.9921875, -3.828125, -3.6640625, -3.5, -3.3359375, -3.171875, -3.0078125, -2.84375, -2.6796875, -2.515625, -2.3515625, -2.1875, -2.0234375, -1.859375, -1.6953125, -1.53125, -1.3671875, -1.203125, -1.0390625, -0.875, -0.7109375, -0.546875, -0.3828125, -0.21875, -0.0546875, 0.109375, 0.2734375, 0.4375, 0.6015625, 0.765625, 0.9296875, 1.09375, 1.2578125, 1.421875, 1.5859375, 1.75, 1.9140625, 2.078125, 2.2421875, 2.40625, 2.5703125, 2.734375, 2.8984375, 3.0625, 3.2265625, 3.390625, 3.5546875, 3.71875, 3.8828125, 4.046875, 4.2109375, 4.375, 4.5390625, 4.703125, 4.8671875, 5.03125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 15.0, 24.0, 37.0, 60.0, 81.0, 117.0, 118.0, 120.0, 96.0, 89.0, 65.0, 66.0, 28.0, 30.0, 10.0, 13.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7012786865234375, -0.678924560546875, -0.6565704345703125, -0.63421630859375, -0.6118621826171875, -0.589508056640625, -0.5671539306640625, -0.5447998046875, -0.5224456787109375, -0.500091552734375, -0.4777374267578125, -0.45538330078125, -0.4330291748046875, -0.410675048828125, -0.3883209228515625, -0.365966796875, -0.3436126708984375, -0.321258544921875, -0.2989044189453125, -0.27655029296875, -0.2541961669921875, -0.231842041015625, -0.2094879150390625, -0.1871337890625, -0.1647796630859375, -0.142425537109375, -0.1200714111328125, -0.09771728515625, -0.0753631591796875, -0.053009033203125, -0.0306549072265625, -0.00830078125, 0.0140533447265625, 0.036407470703125, 0.0587615966796875, 0.08111572265625, 0.1034698486328125, 0.125823974609375, 0.1481781005859375, 0.1705322265625, 0.1928863525390625, 0.215240478515625, 0.2375946044921875, 0.25994873046875, 0.2823028564453125, 0.304656982421875, 0.3270111083984375, 0.349365234375, 0.3717193603515625, 0.394073486328125, 0.4164276123046875, 0.43878173828125, 0.4611358642578125, 0.483489990234375, 0.5058441162109375, 0.5281982421875, 0.5505523681640625, 0.572906494140625, 0.5952606201171875, 0.61761474609375, 0.6399688720703125, 0.662322998046875, 0.6846771240234375, 0.70703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 13.0, 16.0, 12.0, 22.0, 35.0, 31.0, 47.0, 70.0, 105.0, 113.0, 198.0, 239.0, 377.0, 571.0, 820.0, 1418.0, 2434.0, 5533.0, 16340.0, 83085.0, 3706939.0, 324832.0, 33326.0, 8895.0, 3742.0, 1781.0, 1091.0, 661.0, 436.0, 305.0, 198.0, 156.0, 122.0, 83.0, 65.0, 42.0, 32.0, 27.0, 20.0, 15.0, 8.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8282318115234375, -1.768768310546875, -1.7093048095703125, -1.64984130859375, -1.5903778076171875, -1.530914306640625, -1.4714508056640625, -1.4119873046875, -1.3525238037109375, -1.293060302734375, -1.2335968017578125, -1.17413330078125, -1.1146697998046875, -1.055206298828125, -0.9957427978515625, -0.936279296875, -0.8768157958984375, -0.817352294921875, -0.7578887939453125, -0.69842529296875, -0.6389617919921875, -0.579498291015625, -0.5200347900390625, -0.4605712890625, -0.4011077880859375, -0.341644287109375, -0.2821807861328125, -0.22271728515625, -0.1632537841796875, -0.103790283203125, -0.0443267822265625, 0.01513671875, 0.0746002197265625, 0.134063720703125, 0.1935272216796875, 0.25299072265625, 0.3124542236328125, 0.371917724609375, 0.4313812255859375, 0.4908447265625, 0.5503082275390625, 0.609771728515625, 0.6692352294921875, 0.72869873046875, 0.7881622314453125, 0.847625732421875, 0.9070892333984375, 0.966552734375, 1.0260162353515625, 1.085479736328125, 1.1449432373046875, 1.20440673828125, 1.2638702392578125, 1.323333740234375, 1.3827972412109375, 1.4422607421875, 1.5017242431640625, 1.561187744140625, 1.6206512451171875, 1.68011474609375, 1.7395782470703125, 1.799041748046875, 1.8585052490234375, 1.91796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 8.0, 6.0, 18.0, 22.0, 59.0, 175.0, 2627.0, 889.0, 152.0, 53.0, 25.0, 15.0, 8.0, 2.0, 2.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.458984375, -1.4171600341796875, -1.375335693359375, -1.3335113525390625, -1.29168701171875, -1.2498626708984375, -1.208038330078125, -1.1662139892578125, -1.1243896484375, -1.0825653076171875, -1.040740966796875, -0.9989166259765625, -0.95709228515625, -0.9152679443359375, -0.873443603515625, -0.8316192626953125, -0.789794921875, -0.7479705810546875, -0.706146240234375, -0.6643218994140625, -0.62249755859375, -0.5806732177734375, -0.538848876953125, -0.4970245361328125, -0.4552001953125, -0.4133758544921875, -0.371551513671875, -0.3297271728515625, -0.28790283203125, -0.2460784912109375, -0.204254150390625, -0.1624298095703125, -0.12060546875, -0.0787811279296875, -0.036956787109375, 0.0048675537109375, 0.04669189453125, 0.0885162353515625, 0.130340576171875, 0.1721649169921875, 0.2139892578125, 0.2558135986328125, 0.297637939453125, 0.3394622802734375, 0.38128662109375, 0.4231109619140625, 0.464935302734375, 0.5067596435546875, 0.548583984375, 0.5904083251953125, 0.632232666015625, 0.6740570068359375, 0.71588134765625, 0.7577056884765625, 0.799530029296875, 0.8413543701171875, 0.8831787109375, 0.9250030517578125, 0.966827392578125, 1.0086517333984375, 1.05047607421875, 1.0923004150390625, 1.134124755859375, 1.1759490966796875, 1.2177734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 8.0, 25.0, 48.0, 128.0, 226.0, 237.0, 155.0, 91.0, 25.0, 22.0, 13.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4178354740142822, -3.2553305625915527, -3.092825412750244, -2.9303205013275146, -2.767815589904785, -2.6053104400634766, -2.442805528640747, -2.2803006172180176, -2.117795467376709, -1.95529043674469, -1.7927855253219604, -1.6302804946899414, -1.467775583267212, -1.3052705526351929, -1.1427655220031738, -0.9802606105804443, -0.8177556991577148, -0.6552507281303406, -0.4927457273006439, -0.33024072647094727, -0.167735755443573, -0.0052307844161987305, 0.1572742462158203, 0.3197791576385498, 0.48228418827056885, 0.6447891592979431, 0.8072941303253174, 0.9697991609573364, 1.1323041915893555, 1.294809103012085, 1.457314133644104, 1.6198190450668335, 1.7823243141174316, 1.9448293447494507, 2.1073343753814697, 2.269839286804199, 2.4323441982269287, 2.594849109649658, 2.757354259490967, 2.9198591709136963, 3.082364082336426, 3.2448689937591553, 3.407374143600464, 3.5698790550231934, 3.732383966445923, 3.8948888778686523, 4.057394027709961, 4.2198991775512695, 4.382404327392578, 4.544909477233887, 4.707414150238037, 4.869919300079346, 5.032424449920654, 5.194929122924805, 5.357434272766113, 5.519939422607422, 5.682444095611572, 5.844949245452881, 6.007453918457031, 6.16995906829834, 6.332464218139648, 6.494968891143799, 6.657474040985107, 6.819978713989258, 6.982483863830566]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 12.0, 7.0, 34.0, 40.0, 43.0, 60.0, 63.0, 80.0, 75.0, 91.0, 77.0, 91.0, 90.0, 54.0, 43.0, 38.0, 27.0, 16.0, 12.0, 9.0, 10.0, 5.0, 2.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9185948371887207, -3.8101539611816406, -3.7017130851745605, -3.5932722091674805, -3.4848310947418213, -3.376390218734741, -3.267949342727661, -3.159508466720581, -3.051067352294922, -2.942626476287842, -2.8341856002807617, -2.7257447242736816, -2.6173036098480225, -2.5088627338409424, -2.4004218578338623, -2.2919809818267822, -2.183540105819702, -2.075099229812622, -1.9666582345962524, -1.8582173585891724, -1.7497763633728027, -1.6413354873657227, -1.5328946113586426, -1.4244537353515625, -1.3160127401351929, -1.2075718641281128, -1.0991308689117432, -0.9906899929046631, -0.8822490572929382, -0.7738081216812134, -0.6653672456741333, -0.5569263100624084, -0.4484851360321045, -0.34004420042037964, -0.23160329461097717, -0.12316238880157471, -0.014721453189849854, 0.093719482421875, 0.20216035842895508, 0.31060129404067993, 0.4190422296524048, 0.5274831652641296, 0.6359241008758545, 0.7443649768829346, 0.8528059124946594, 0.9612468481063843, 1.0696877241134644, 1.178128719329834, 1.286569595336914, 1.3950104713439941, 1.5034514665603638, 1.6118923425674438, 1.7203333377838135, 1.8287742137908936, 1.9372150897979736, 2.0456559658050537, 2.154097080230713, 2.262537956237793, 2.370978832244873, 2.479419708251953, 2.5878608226776123, 2.6963016986846924, 2.8047425746917725, 2.9131834506988525, 3.0216243267059326]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 15.0, 18.0, 28.0, 48.0, 86.0, 173.0, 252.0, 495.0, 1006.0, 2052.0, 5512.0, 30889.0, 399416.0, 552925.0, 43886.0, 6976.0, 2405.0, 1074.0, 601.0, 287.0, 161.0, 89.0, 73.0, 36.0, 13.0, 9.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.103515625, -3.000335693359375, -2.89715576171875, -2.793975830078125, -2.6907958984375, -2.587615966796875, -2.48443603515625, -2.381256103515625, -2.278076171875, -2.174896240234375, -2.07171630859375, -1.968536376953125, -1.8653564453125, -1.762176513671875, -1.65899658203125, -1.555816650390625, -1.45263671875, -1.349456787109375, -1.24627685546875, -1.143096923828125, -1.0399169921875, -0.936737060546875, -0.83355712890625, -0.730377197265625, -0.627197265625, -0.524017333984375, -0.42083740234375, -0.317657470703125, -0.2144775390625, -0.111297607421875, -0.00811767578125, 0.095062255859375, 0.1982421875, 0.301422119140625, 0.40460205078125, 0.507781982421875, 0.6109619140625, 0.714141845703125, 0.81732177734375, 0.920501708984375, 1.023681640625, 1.126861572265625, 1.23004150390625, 1.333221435546875, 1.4364013671875, 1.539581298828125, 1.64276123046875, 1.745941162109375, 1.84912109375, 1.952301025390625, 2.05548095703125, 2.158660888671875, 2.2618408203125, 2.365020751953125, 2.46820068359375, 2.571380615234375, 2.674560546875, 2.777740478515625, 2.88092041015625, 2.984100341796875, 3.0872802734375, 3.190460205078125, 3.29364013671875, 3.396820068359375, 3.5]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 17.0, 18.0, 53.0, 62.0, 94.0, 129.0, 111.0, 123.0, 84.0, 74.0, 73.0, 45.0, 46.0, 17.0, 15.0, 3.0, 9.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77978515625, -0.7555084228515625, -0.731231689453125, -0.7069549560546875, -0.68267822265625, -0.6584014892578125, -0.634124755859375, -0.6098480224609375, -0.5855712890625, -0.5612945556640625, -0.537017822265625, -0.5127410888671875, -0.48846435546875, -0.4641876220703125, -0.439910888671875, -0.4156341552734375, -0.391357421875, -0.3670806884765625, -0.342803955078125, -0.3185272216796875, -0.29425048828125, -0.2699737548828125, -0.245697021484375, -0.2214202880859375, -0.1971435546875, -0.1728668212890625, -0.148590087890625, -0.1243133544921875, -0.10003662109375, -0.0757598876953125, -0.051483154296875, -0.0272064208984375, -0.0029296875, 0.0213470458984375, 0.045623779296875, 0.0699005126953125, 0.09417724609375, 0.1184539794921875, 0.142730712890625, 0.1670074462890625, 0.1912841796875, 0.2155609130859375, 0.239837646484375, 0.2641143798828125, 0.28839111328125, 0.3126678466796875, 0.336944580078125, 0.3612213134765625, 0.385498046875, 0.4097747802734375, 0.434051513671875, 0.4583282470703125, 0.48260498046875, 0.5068817138671875, 0.531158447265625, 0.5554351806640625, 0.5797119140625, 0.6039886474609375, 0.628265380859375, 0.6525421142578125, 0.67681884765625, 0.7010955810546875, 0.725372314453125, 0.7496490478515625, 0.77392578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 10.0, 7.0, 6.0, 18.0, 23.0, 37.0, 51.0, 72.0, 94.0, 164.0, 249.0, 436.0, 820.0, 1561.0, 3123.0, 7368.0, 18734.0, 56279.0, 181777.0, 408451.0, 248042.0, 78771.0, 25104.0, 9307.0, 3910.0, 1856.0, 913.0, 490.0, 327.0, 196.0, 117.0, 65.0, 60.0, 34.0, 25.0, 20.0, 13.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.9598846435546875, -0.928558349609375, -0.8972320556640625, -0.86590576171875, -0.8345794677734375, -0.803253173828125, -0.7719268798828125, -0.7406005859375, -0.7092742919921875, -0.677947998046875, -0.6466217041015625, -0.61529541015625, -0.5839691162109375, -0.552642822265625, -0.5213165283203125, -0.489990234375, -0.4586639404296875, -0.427337646484375, -0.3960113525390625, -0.36468505859375, -0.3333587646484375, -0.302032470703125, -0.2707061767578125, -0.2393798828125, -0.2080535888671875, -0.176727294921875, -0.1454010009765625, -0.11407470703125, -0.0827484130859375, -0.051422119140625, -0.0200958251953125, 0.01123046875, 0.0425567626953125, 0.073883056640625, 0.1052093505859375, 0.13653564453125, 0.1678619384765625, 0.199188232421875, 0.2305145263671875, 0.2618408203125, 0.2931671142578125, 0.324493408203125, 0.3558197021484375, 0.38714599609375, 0.4184722900390625, 0.449798583984375, 0.4811248779296875, 0.512451171875, 0.5437774658203125, 0.575103759765625, 0.6064300537109375, 0.63775634765625, 0.6690826416015625, 0.700408935546875, 0.7317352294921875, 0.7630615234375, 0.7943878173828125, 0.825714111328125, 0.8570404052734375, 0.88836669921875, 0.9196929931640625, 0.951019287109375, 0.9823455810546875, 1.013671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 9.0, 9.0, 11.0, 9.0, 7.0, 17.0, 17.0, 17.0, 30.0, 36.0, 27.0, 28.0, 49.0, 54.0, 51.0, 63.0, 46.0, 63.0, 58.0, 47.0, 45.0, 49.0, 34.0, 35.0, 32.0, 33.0, 28.0, 16.0, 9.0, 15.0, 14.0, 7.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.42730712890625, -1.3800048828125, -1.33270263671875, -1.285400390625, -1.23809814453125, -1.1907958984375, -1.14349365234375, -1.09619140625, -1.04888916015625, -1.0015869140625, -0.95428466796875, -0.906982421875, -0.85968017578125, -0.8123779296875, -0.76507568359375, -0.7177734375, -0.67047119140625, -0.6231689453125, -0.57586669921875, -0.528564453125, -0.48126220703125, -0.4339599609375, -0.38665771484375, -0.33935546875, -0.29205322265625, -0.2447509765625, -0.19744873046875, -0.150146484375, -0.10284423828125, -0.0555419921875, -0.00823974609375, 0.0390625, 0.08636474609375, 0.1336669921875, 0.18096923828125, 0.228271484375, 0.27557373046875, 0.3228759765625, 0.37017822265625, 0.41748046875, 0.46478271484375, 0.5120849609375, 0.55938720703125, 0.606689453125, 0.65399169921875, 0.7012939453125, 0.74859619140625, 0.7958984375, 0.84320068359375, 0.8905029296875, 0.93780517578125, 0.985107421875, 1.03240966796875, 1.0797119140625, 1.12701416015625, 1.17431640625, 1.22161865234375, 1.2689208984375, 1.31622314453125, 1.363525390625, 1.41082763671875, 1.4581298828125, 1.50543212890625, 1.552734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 18.0, 34.0, 61.0, 146.0, 379.0, 1474.0, 11004.0, 594144.0, 430626.0, 8683.0, 1307.0, 406.0, 147.0, 54.0, 34.0, 12.0, 4.0, 2.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -2.0, -1.951171875, -1.90234375, -1.853515625, -1.8046875, -1.755859375, -1.70703125, -1.658203125, -1.609375, -1.560546875, -1.51171875, -1.462890625, -1.4140625, -1.365234375, -1.31640625, -1.267578125, -1.21875, -1.169921875, -1.12109375, -1.072265625, -1.0234375, -0.974609375, -0.92578125, -0.876953125, -0.828125, -0.779296875, -0.73046875, -0.681640625, -0.6328125, -0.583984375, -0.53515625, -0.486328125, -0.4375, -0.388671875, -0.33984375, -0.291015625, -0.2421875, -0.193359375, -0.14453125, -0.095703125, -0.046875, 0.001953125, 0.05078125, 0.099609375, 0.1484375, 0.197265625, 0.24609375, 0.294921875, 0.34375, 0.392578125, 0.44140625, 0.490234375, 0.5390625, 0.587890625, 0.63671875, 0.685546875, 0.734375, 0.783203125, 0.83203125, 0.880859375, 0.9296875, 0.978515625, 1.02734375, 1.076171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 15.0, 14.0, 31.0, 46.0, 75.0, 120.0, 139.0, 162.0, 129.0, 97.0, 58.0, 41.0, 21.0, 13.0, 8.0, 5.0, 8.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.00021147727966308594, -0.0002070888876914978, -0.00020270049571990967, -0.00019831210374832153, -0.0001939237117767334, -0.00018953531980514526, -0.00018514692783355713, -0.000180758535861969, -0.00017637014389038086, -0.00017198175191879272, -0.0001675933599472046, -0.00016320496797561646, -0.00015881657600402832, -0.00015442818403244019, -0.00015003979206085205, -0.00014565140008926392, -0.00014126300811767578, -0.00013687461614608765, -0.0001324862241744995, -0.00012809783220291138, -0.00012370944023132324, -0.00011932104825973511, -0.00011493265628814697, -0.00011054426431655884, -0.0001061558723449707, -0.00010176748037338257, -9.737908840179443e-05, -9.29906964302063e-05, -8.860230445861816e-05, -8.421391248703003e-05, -7.98255205154419e-05, -7.543712854385376e-05, -7.104873657226562e-05, -6.666034460067749e-05, -6.227195262908936e-05, -5.788356065750122e-05, -5.3495168685913086e-05, -4.910677671432495e-05, -4.4718384742736816e-05, -4.032999277114868e-05, -3.594160079956055e-05, -3.155320882797241e-05, -2.7164816856384277e-05, -2.2776424884796143e-05, -1.8388032913208008e-05, -1.3999640941619873e-05, -9.611248970031738e-06, -5.2228569984436035e-06, -8.344650268554688e-07, 3.553926944732666e-06, 7.9423189163208e-06, 1.2330710887908936e-05, 1.671910285949707e-05, 2.1107494831085205e-05, 2.549588680267334e-05, 2.9884278774261475e-05, 3.427267074584961e-05, 3.8661062717437744e-05, 4.304945468902588e-05, 4.7437846660614014e-05, 5.182623863220215e-05, 5.621463060379028e-05, 6.060302257537842e-05, 6.499141454696655e-05, 6.937980651855469e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 9.0, 18.0, 37.0, 37.0, 77.0, 159.0, 360.0, 1071.0, 3927.0, 21570.0, 225159.0, 702962.0, 79484.0, 10226.0, 2212.0, 684.0, 249.0, 114.0, 69.0, 36.0, 23.0, 21.0, 13.0, 10.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7437515258789062, -0.7165069580078125, -0.6892623901367188, -0.662017822265625, -0.6347732543945312, -0.6075286865234375, -0.5802841186523438, -0.55303955078125, -0.5257949829101562, -0.4985504150390625, -0.47130584716796875, -0.444061279296875, -0.41681671142578125, -0.3895721435546875, -0.36232757568359375, -0.3350830078125, -0.30783843994140625, -0.2805938720703125, -0.25334930419921875, -0.226104736328125, -0.19886016845703125, -0.1716156005859375, -0.14437103271484375, -0.11712646484375, -0.08988189697265625, -0.0626373291015625, -0.03539276123046875, -0.008148193359375, 0.01909637451171875, 0.0463409423828125, 0.07358551025390625, 0.100830078125, 0.12807464599609375, 0.1553192138671875, 0.18256378173828125, 0.209808349609375, 0.23705291748046875, 0.2642974853515625, 0.29154205322265625, 0.31878662109375, 0.34603118896484375, 0.3732757568359375, 0.40052032470703125, 0.427764892578125, 0.45500946044921875, 0.4822540283203125, 0.5094985961914062, 0.5367431640625, 0.5639877319335938, 0.5912322998046875, 0.6184768676757812, 0.645721435546875, 0.6729660034179688, 0.7002105712890625, 0.7274551391601562, 0.75469970703125, 0.7819442749023438, 0.8091888427734375, 0.8364334106445312, 0.863677978515625, 0.8909225463867188, 0.9181671142578125, 0.9454116821289062, 0.97265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 13.0, 23.0, 21.0, 31.0, 56.0, 74.0, 112.0, 156.0, 132.0, 112.0, 90.0, 54.0, 46.0, 16.0, 18.0, 13.0, 12.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2978515625, -1.268402099609375, -1.23895263671875, -1.209503173828125, -1.1800537109375, -1.150604248046875, -1.12115478515625, -1.091705322265625, -1.062255859375, -1.032806396484375, -1.00335693359375, -0.973907470703125, -0.9444580078125, -0.915008544921875, -0.88555908203125, -0.856109619140625, -0.82666015625, -0.797210693359375, -0.76776123046875, -0.738311767578125, -0.7088623046875, -0.679412841796875, -0.64996337890625, -0.620513916015625, -0.591064453125, -0.561614990234375, -0.53216552734375, -0.502716064453125, -0.4732666015625, -0.443817138671875, -0.41436767578125, -0.384918212890625, -0.35546875, -0.326019287109375, -0.29656982421875, -0.267120361328125, -0.2376708984375, -0.208221435546875, -0.17877197265625, -0.149322509765625, -0.119873046875, -0.090423583984375, -0.06097412109375, -0.031524658203125, -0.0020751953125, 0.027374267578125, 0.05682373046875, 0.086273193359375, 0.11572265625, 0.145172119140625, 0.17462158203125, 0.204071044921875, 0.2335205078125, 0.262969970703125, 0.29241943359375, 0.321868896484375, 0.351318359375, 0.380767822265625, 0.41021728515625, 0.439666748046875, 0.4691162109375, 0.498565673828125, 0.52801513671875, 0.557464599609375, 0.5869140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 14.0, 31.0, 98.0, 293.0, 369.0, 149.0, 45.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.15915298461914, -47.269290924072266, -46.379432678222656, -45.48957061767578, -44.59971237182617, -43.7098503112793, -42.81999206542969, -41.93013000488281, -41.04026794433594, -40.15040588378906, -39.26054763793945, -38.37068557739258, -37.48082733154297, -36.590965270996094, -35.701107025146484, -34.81124496459961, -33.92138671875, -33.031524658203125, -32.141666412353516, -31.251806259155273, -30.36194610595703, -29.472084045410156, -28.582223892211914, -27.692363739013672, -26.80250358581543, -25.912643432617188, -25.022783279418945, -24.132923126220703, -23.243061065673828, -22.35320281982422, -21.463340759277344, -20.5734806060791, -19.683622360229492, -18.79376220703125, -17.903902053833008, -17.014041900634766, -16.12417984008789, -15.234320640563965, -14.344459533691406, -13.454599380493164, -12.564739227294922, -11.67487907409668, -10.785018920898438, -9.895157814025879, -9.005297660827637, -8.115437507629395, -7.225576877593994, -6.335716247558594, -5.445856094360352, -4.555995941162109, -3.666135311126709, -2.7762749195098877, -1.8864145278930664, -0.9965543746948242, -0.10669374465942383, 0.7831668853759766, 1.6730270385742188, 2.56288743019104, 3.4527478218078613, 4.342608451843262, 5.232468605041504, 6.122328758239746, 7.0121893882751465, 7.902050018310547, 8.791910171508789]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 9.0, 15.0, 12.0, 18.0, 19.0, 17.0, 17.0, 25.0, 26.0, 21.0, 31.0, 35.0, 44.0, 41.0, 37.0, 32.0, 42.0, 42.0, 40.0, 45.0, 44.0, 37.0, 35.0, 39.0, 36.0, 30.0, 26.0, 22.0, 20.0, 16.0, 16.0, 12.0, 18.0, 11.0, 7.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.000665187835693, -6.785818099975586, -6.5709710121154785, -6.356123924255371, -6.141276836395264, -5.926429748535156, -5.711583137512207, -5.4967360496521, -5.281888961791992, -5.067041873931885, -4.852194786071777, -4.63734769821167, -4.4225006103515625, -4.207653999328613, -3.9928066730499268, -3.7779598236083984, -3.563112497329712, -3.3482654094696045, -3.133418321609497, -2.9185714721679688, -2.7037243843078613, -2.488877296447754, -2.2740302085876465, -2.059183120727539, -1.8443361520767212, -1.6294890642166138, -1.414642095565796, -1.1997950077056885, -0.9849479794502258, -0.7701009511947632, -0.5552538633346558, -0.3404068946838379, -0.12555980682373047, 0.08928723633289337, 0.3041342794895172, 0.5189813375473022, 0.7338283658027649, 0.9486753940582275, 1.163522481918335, 1.3783694505691528, 1.5932165384292603, 1.8080636262893677, 2.0229105949401855, 2.237757682800293, 2.4526047706604004, 2.667451858520508, 2.8822989463806152, 3.0971457958221436, 3.311992883682251, 3.5268399715423584, 3.741687059402466, 3.956533908843994, 4.171380996704102, 4.386228084564209, 4.601075172424316, 4.815922260284424, 5.030769348144531, 5.245616436004639, 5.460463523864746, 5.6753106117248535, 5.890157699584961, 6.10500431060791, 6.319851875305176, 6.534698486328125, 6.749545574188232]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 6.0, 12.0, 20.0, 19.0, 35.0, 31.0, 54.0, 48.0, 65.0, 115.0, 144.0, 207.0, 365.0, 538.0, 956.0, 1705.0, 3611.0, 9285.0, 32687.0, 319047.0, 3720014.0, 76978.0, 16842.0, 5734.0, 2516.0, 1225.0, 695.0, 417.0, 276.0, 183.0, 112.0, 77.0, 61.0, 38.0, 34.0, 26.0, 13.0, 15.0, 12.0, 12.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.76953125, -2.68621826171875, -2.6029052734375, -2.51959228515625, -2.436279296875, -2.35296630859375, -2.2696533203125, -2.18634033203125, -2.10302734375, -2.01971435546875, -1.9364013671875, -1.85308837890625, -1.769775390625, -1.68646240234375, -1.6031494140625, -1.51983642578125, -1.4365234375, -1.35321044921875, -1.2698974609375, -1.18658447265625, -1.103271484375, -1.01995849609375, -0.9366455078125, -0.85333251953125, -0.77001953125, -0.68670654296875, -0.6033935546875, -0.52008056640625, -0.436767578125, -0.35345458984375, -0.2701416015625, -0.18682861328125, -0.103515625, -0.02020263671875, 0.0631103515625, 0.14642333984375, 0.229736328125, 0.31304931640625, 0.3963623046875, 0.47967529296875, 0.56298828125, 0.64630126953125, 0.7296142578125, 0.81292724609375, 0.896240234375, 0.97955322265625, 1.0628662109375, 1.14617919921875, 1.2294921875, 1.31280517578125, 1.3961181640625, 1.47943115234375, 1.562744140625, 1.64605712890625, 1.7293701171875, 1.81268310546875, 1.89599609375, 1.97930908203125, 2.0626220703125, 2.14593505859375, 2.229248046875, 2.31256103515625, 2.3958740234375, 2.47918701171875, 2.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 9.0, 13.0, 20.0, 29.0, 52.0, 68.0, 79.0, 100.0, 100.0, 102.0, 94.0, 84.0, 69.0, 40.0, 47.0, 22.0, 24.0, 14.0, 11.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7890625, -0.7645950317382812, -0.7401275634765625, -0.7156600952148438, -0.691192626953125, -0.6667251586914062, -0.6422576904296875, -0.6177902221679688, -0.59332275390625, -0.5688552856445312, -0.5443878173828125, -0.5199203491210938, -0.495452880859375, -0.47098541259765625, -0.4465179443359375, -0.42205047607421875, -0.3975830078125, -0.37311553955078125, -0.3486480712890625, -0.32418060302734375, -0.299713134765625, -0.27524566650390625, -0.2507781982421875, -0.22631072998046875, -0.20184326171875, -0.17737579345703125, -0.1529083251953125, -0.12844085693359375, -0.103973388671875, -0.07950592041015625, -0.0550384521484375, -0.03057098388671875, -0.006103515625, 0.01836395263671875, 0.0428314208984375, 0.06729888916015625, 0.091766357421875, 0.11623382568359375, 0.1407012939453125, 0.16516876220703125, 0.18963623046875, 0.21410369873046875, 0.2385711669921875, 0.26303863525390625, 0.287506103515625, 0.31197357177734375, 0.3364410400390625, 0.36090850830078125, 0.3853759765625, 0.40984344482421875, 0.4343109130859375, 0.45877838134765625, 0.483245849609375, 0.5077133178710938, 0.5321807861328125, 0.5566482543945312, 0.58111572265625, 0.6055831909179688, 0.6300506591796875, 0.6545181274414062, 0.678985595703125, 0.7034530639648438, 0.7279205322265625, 0.7523880004882812, 0.77685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 11.0, 14.0, 33.0, 29.0, 41.0, 69.0, 95.0, 115.0, 203.0, 253.0, 423.0, 620.0, 1083.0, 2448.0, 7586.0, 37593.0, 1162235.0, 2922803.0, 44487.0, 8354.0, 2622.0, 1163.0, 702.0, 421.0, 277.0, 181.0, 140.0, 88.0, 56.0, 35.0, 20.0, 27.0, 20.0, 10.0, 9.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9453125, -2.86358642578125, -2.7818603515625, -2.70013427734375, -2.618408203125, -2.53668212890625, -2.4549560546875, -2.37322998046875, -2.29150390625, -2.20977783203125, -2.1280517578125, -2.04632568359375, -1.964599609375, -1.88287353515625, -1.8011474609375, -1.71942138671875, -1.6376953125, -1.55596923828125, -1.4742431640625, -1.39251708984375, -1.310791015625, -1.22906494140625, -1.1473388671875, -1.06561279296875, -0.98388671875, -0.90216064453125, -0.8204345703125, -0.73870849609375, -0.656982421875, -0.57525634765625, -0.4935302734375, -0.41180419921875, -0.330078125, -0.24835205078125, -0.1666259765625, -0.08489990234375, -0.003173828125, 0.07855224609375, 0.1602783203125, 0.24200439453125, 0.32373046875, 0.40545654296875, 0.4871826171875, 0.56890869140625, 0.650634765625, 0.73236083984375, 0.8140869140625, 0.89581298828125, 0.9775390625, 1.05926513671875, 1.1409912109375, 1.22271728515625, 1.304443359375, 1.38616943359375, 1.4678955078125, 1.54962158203125, 1.63134765625, 1.71307373046875, 1.7947998046875, 1.87652587890625, 1.958251953125, 2.03997802734375, 2.1217041015625, 2.20343017578125, 2.28515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 26.0, 59.0, 172.0, 1556.0, 1921.0, 188.0, 59.0, 31.0, 18.0, 9.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.5897674560546875, -1.526214599609375, -1.4626617431640625, -1.39910888671875, -1.3355560302734375, -1.272003173828125, -1.2084503173828125, -1.1448974609375, -1.0813446044921875, -1.017791748046875, -0.9542388916015625, -0.89068603515625, -0.8271331787109375, -0.763580322265625, -0.7000274658203125, -0.636474609375, -0.5729217529296875, -0.509368896484375, -0.4458160400390625, -0.38226318359375, -0.3187103271484375, -0.255157470703125, -0.1916046142578125, -0.1280517578125, -0.0644989013671875, -0.000946044921875, 0.0626068115234375, 0.12615966796875, 0.1897125244140625, 0.253265380859375, 0.3168182373046875, 0.38037109375, 0.4439239501953125, 0.507476806640625, 0.5710296630859375, 0.63458251953125, 0.6981353759765625, 0.761688232421875, 0.8252410888671875, 0.8887939453125, 0.9523468017578125, 1.015899658203125, 1.0794525146484375, 1.14300537109375, 1.2065582275390625, 1.270111083984375, 1.3336639404296875, 1.397216796875, 1.4607696533203125, 1.524322509765625, 1.5878753662109375, 1.65142822265625, 1.7149810791015625, 1.778533935546875, 1.8420867919921875, 1.9056396484375, 1.9691925048828125, 2.032745361328125, 2.0962982177734375, 2.15985107421875, 2.2234039306640625, 2.286956787109375, 2.3505096435546875, 2.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 9.0, 9.0, 15.0, 27.0, 47.0, 90.0, 128.0, 176.0, 181.0, 117.0, 104.0, 38.0, 27.0, 9.0, 9.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.853998184204102, -6.669008731842041, -6.484019756317139, -6.299030303955078, -6.114041328430176, -5.929051876068115, -5.744062423706055, -5.559073448181152, -5.374083995819092, -5.189094543457031, -5.004105567932129, -4.819116115570068, -4.634126663208008, -4.4491376876831055, -4.264148235321045, -4.079158782958984, -3.894169807434082, -3.7091805934906006, -3.524191379547119, -3.3392019271850586, -3.154212713241577, -2.9692234992980957, -2.784234046936035, -2.5992448329925537, -2.4142556190490723, -2.229266405105591, -2.0442771911621094, -1.8592877388000488, -1.6742985248565674, -1.489309310913086, -1.304319977760315, -1.119330644607544, -0.9343414306640625, -0.7493521571159363, -0.5643628835678101, -0.37937361001968384, -0.19438433647155762, -0.009395062923431396, 0.17559421062469482, 0.3605835437774658, 0.5455727577209473, 0.7305620312690735, 0.9155513048171997, 1.1005406379699707, 1.2855298519134521, 1.4705190658569336, 1.6555083990097046, 1.8404977321624756, 2.025486946105957, 2.2104761600494385, 2.39546537399292, 2.5804548263549805, 2.765444040298462, 2.9504332542419434, 3.135422706604004, 3.3204119205474854, 3.505401134490967, 3.6903903484344482, 3.8753795623779297, 4.06036901473999, 4.245358467102051, 4.430347442626953, 4.615336894989014, 4.800326347351074, 4.985315322875977]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 2.0, 9.0, 9.0, 12.0, 16.0, 33.0, 42.0, 51.0, 53.0, 66.0, 81.0, 76.0, 77.0, 96.0, 64.0, 73.0, 50.0, 53.0, 41.0, 24.0, 18.0, 21.0, 6.0, 8.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.932065963745117, -3.772571563720703, -3.613077163696289, -3.453583002090454, -3.29408860206604, -3.134594202041626, -2.975100040435791, -2.815605640411377, -2.656111240386963, -2.496616840362549, -2.3371224403381348, -2.1776282787323, -2.0181338787078857, -1.8586394786834717, -1.6991451978683472, -1.5396509170532227, -1.3801565170288086, -1.2206621170043945, -1.06116783618927, -0.9016734957695007, -0.7421791553497314, -0.5826848149299622, -0.42319047451019287, -0.26369619369506836, -0.1042017936706543, 0.05529254674911499, 0.21478688716888428, 0.37428122758865356, 0.5337755680084229, 0.6932699084281921, 0.8527642488479614, 1.012258529663086, 1.1717529296875, 1.331247329711914, 1.4907416105270386, 1.650235891342163, 1.8097302913665771, 1.9692246913909912, 2.128718852996826, 2.2882132530212402, 2.4477076530456543, 2.6072020530700684, 2.7666964530944824, 2.9261906147003174, 3.0856850147247314, 3.2451794147491455, 3.4046735763549805, 3.5641679763793945, 3.7236623764038086, 3.8831567764282227, 4.042651176452637, 4.202145576477051, 4.361639976501465, 4.521133899688721, 4.680628299713135, 4.840122699737549, 4.999617099761963, 5.159111499786377, 5.318605899810791, 5.478100299835205, 5.637594223022461, 5.797088623046875, 5.956583023071289, 6.116077423095703, 6.275571823120117]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 4.0, 14.0, 16.0, 27.0, 26.0, 49.0, 78.0, 93.0, 127.0, 160.0, 237.0, 398.0, 621.0, 1058.0, 1722.0, 3652.0, 8466.0, 24708.0, 91722.0, 357865.0, 400129.0, 110030.0, 28707.0, 9585.0, 3978.0, 1957.0, 1104.0, 664.0, 367.0, 312.0, 203.0, 130.0, 101.0, 62.0, 34.0, 36.0, 28.0, 14.0, 18.0, 13.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-2.005859375, -1.94329833984375, -1.8807373046875, -1.81817626953125, -1.755615234375, -1.69305419921875, -1.6304931640625, -1.56793212890625, -1.50537109375, -1.44281005859375, -1.3802490234375, -1.31768798828125, -1.255126953125, -1.19256591796875, -1.1300048828125, -1.06744384765625, -1.0048828125, -0.94232177734375, -0.8797607421875, -0.81719970703125, -0.754638671875, -0.69207763671875, -0.6295166015625, -0.56695556640625, -0.50439453125, -0.44183349609375, -0.3792724609375, -0.31671142578125, -0.254150390625, -0.19158935546875, -0.1290283203125, -0.06646728515625, -0.00390625, 0.05865478515625, 0.1212158203125, 0.18377685546875, 0.246337890625, 0.30889892578125, 0.3714599609375, 0.43402099609375, 0.49658203125, 0.55914306640625, 0.6217041015625, 0.68426513671875, 0.746826171875, 0.80938720703125, 0.8719482421875, 0.93450927734375, 0.9970703125, 1.05963134765625, 1.1221923828125, 1.18475341796875, 1.247314453125, 1.30987548828125, 1.3724365234375, 1.43499755859375, 1.49755859375, 1.56011962890625, 1.6226806640625, 1.68524169921875, 1.747802734375, 1.81036376953125, 1.8729248046875, 1.93548583984375, 1.998046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 16.0, 27.0, 32.0, 50.0, 65.0, 89.0, 106.0, 98.0, 106.0, 94.0, 81.0, 69.0, 39.0, 32.0, 27.0, 19.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81103515625, -0.783966064453125, -0.75689697265625, -0.729827880859375, -0.7027587890625, -0.675689697265625, -0.64862060546875, -0.621551513671875, -0.594482421875, -0.567413330078125, -0.54034423828125, -0.513275146484375, -0.4862060546875, -0.459136962890625, -0.43206787109375, -0.404998779296875, -0.3779296875, -0.350860595703125, -0.32379150390625, -0.296722412109375, -0.2696533203125, -0.242584228515625, -0.21551513671875, -0.188446044921875, -0.161376953125, -0.134307861328125, -0.10723876953125, -0.080169677734375, -0.0531005859375, -0.026031494140625, 0.00103759765625, 0.028106689453125, 0.05517578125, 0.082244873046875, 0.10931396484375, 0.136383056640625, 0.1634521484375, 0.190521240234375, 0.21759033203125, 0.244659423828125, 0.271728515625, 0.298797607421875, 0.32586669921875, 0.352935791015625, 0.3800048828125, 0.407073974609375, 0.43414306640625, 0.461212158203125, 0.48828125, 0.515350341796875, 0.54241943359375, 0.569488525390625, 0.5965576171875, 0.623626708984375, 0.65069580078125, 0.677764892578125, 0.704833984375, 0.731903076171875, 0.75897216796875, 0.786041259765625, 0.8131103515625, 0.840179443359375, 0.86724853515625, 0.894317626953125, 0.92138671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 12.0, 26.0, 22.0, 33.0, 50.0, 105.0, 155.0, 259.0, 433.0, 820.0, 1670.0, 3509.0, 8394.0, 21835.0, 67962.0, 247397.0, 454936.0, 165859.0, 47052.0, 16078.0, 6304.0, 2744.0, 1260.0, 647.0, 350.0, 222.0, 113.0, 95.0, 53.0, 49.0, 30.0, 24.0, 16.0, 11.0, 6.0, 0.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4736328125, -1.4266204833984375, -1.379608154296875, -1.3325958251953125, -1.28558349609375, -1.2385711669921875, -1.191558837890625, -1.1445465087890625, -1.0975341796875, -1.0505218505859375, -1.003509521484375, -0.9564971923828125, -0.90948486328125, -0.8624725341796875, -0.815460205078125, -0.7684478759765625, -0.721435546875, -0.6744232177734375, -0.627410888671875, -0.5803985595703125, -0.53338623046875, -0.4863739013671875, -0.439361572265625, -0.3923492431640625, -0.3453369140625, -0.2983245849609375, -0.251312255859375, -0.2042999267578125, -0.15728759765625, -0.1102752685546875, -0.063262939453125, -0.0162506103515625, 0.03076171875, 0.0777740478515625, 0.124786376953125, 0.1717987060546875, 0.21881103515625, 0.2658233642578125, 0.312835693359375, 0.3598480224609375, 0.4068603515625, 0.4538726806640625, 0.500885009765625, 0.5478973388671875, 0.59490966796875, 0.6419219970703125, 0.688934326171875, 0.7359466552734375, 0.782958984375, 0.8299713134765625, 0.876983642578125, 0.9239959716796875, 0.97100830078125, 1.0180206298828125, 1.065032958984375, 1.1120452880859375, 1.1590576171875, 1.2060699462890625, 1.253082275390625, 1.3000946044921875, 1.34710693359375, 1.3941192626953125, 1.441131591796875, 1.4881439208984375, 1.53515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 12.0, 16.0, 27.0, 34.0, 35.0, 28.0, 56.0, 56.0, 74.0, 70.0, 60.0, 67.0, 69.0, 70.0, 59.0, 50.0, 37.0, 25.0, 26.0, 30.0, 21.0, 15.0, 9.0, 6.0, 8.0, 3.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.294921875, -3.21002197265625, -3.1251220703125, -3.04022216796875, -2.955322265625, -2.87042236328125, -2.7855224609375, -2.70062255859375, -2.61572265625, -2.53082275390625, -2.4459228515625, -2.36102294921875, -2.276123046875, -2.19122314453125, -2.1063232421875, -2.02142333984375, -1.9365234375, -1.85162353515625, -1.7667236328125, -1.68182373046875, -1.596923828125, -1.51202392578125, -1.4271240234375, -1.34222412109375, -1.25732421875, -1.17242431640625, -1.0875244140625, -1.00262451171875, -0.917724609375, -0.83282470703125, -0.7479248046875, -0.66302490234375, -0.578125, -0.49322509765625, -0.4083251953125, -0.32342529296875, -0.238525390625, -0.15362548828125, -0.0687255859375, 0.01617431640625, 0.10107421875, 0.18597412109375, 0.2708740234375, 0.35577392578125, 0.440673828125, 0.52557373046875, 0.6104736328125, 0.69537353515625, 0.7802734375, 0.86517333984375, 0.9500732421875, 1.03497314453125, 1.119873046875, 1.20477294921875, 1.2896728515625, 1.37457275390625, 1.45947265625, 1.54437255859375, 1.6292724609375, 1.71417236328125, 1.799072265625, 1.88397216796875, 1.9688720703125, 2.05377197265625, 2.138671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 8.0, 15.0, 19.0, 41.0, 58.0, 92.0, 187.0, 365.0, 718.0, 1976.0, 6228.0, 28617.0, 258445.0, 654641.0, 78747.0, 12883.0, 3266.0, 1097.0, 551.0, 239.0, 154.0, 83.0, 43.0, 33.0, 18.0, 12.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1300048828125, -1.094970703125, -1.0599365234375, -1.02490234375, -0.9898681640625, -0.954833984375, -0.9197998046875, -0.884765625, -0.8497314453125, -0.814697265625, -0.7796630859375, -0.74462890625, -0.7095947265625, -0.674560546875, -0.6395263671875, -0.6044921875, -0.5694580078125, -0.534423828125, -0.4993896484375, -0.46435546875, -0.4293212890625, -0.394287109375, -0.3592529296875, -0.32421875, -0.2891845703125, -0.254150390625, -0.2191162109375, -0.18408203125, -0.1490478515625, -0.114013671875, -0.0789794921875, -0.0439453125, -0.0089111328125, 0.026123046875, 0.0611572265625, 0.09619140625, 0.1312255859375, 0.166259765625, 0.2012939453125, 0.236328125, 0.2713623046875, 0.306396484375, 0.3414306640625, 0.37646484375, 0.4114990234375, 0.446533203125, 0.4815673828125, 0.5166015625, 0.5516357421875, 0.586669921875, 0.6217041015625, 0.65673828125, 0.6917724609375, 0.726806640625, 0.7618408203125, 0.796875, 0.8319091796875, 0.866943359375, 0.9019775390625, 0.93701171875, 0.9720458984375, 1.007080078125, 1.0421142578125, 1.0771484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 27.0, 37.0, 65.0, 93.0, 143.0, 159.0, 175.0, 110.0, 62.0, 32.0, 27.0, 18.0, 17.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.28640365600586e-05, -8.605979382991791e-05, -7.925555109977722e-05, -7.245130836963654e-05, -6.564706563949585e-05, -5.8842822909355164e-05, -5.203858017921448e-05, -4.523433744907379e-05, -3.8430094718933105e-05, -3.162585198879242e-05, -2.4821609258651733e-05, -1.8017366528511047e-05, -1.1213123798370361e-05, -4.408881068229675e-06, 2.3953616619110107e-06, 9.199604392051697e-06, 1.6003847122192383e-05, 2.280808985233307e-05, 2.9612332582473755e-05, 3.641657531261444e-05, 4.322081804275513e-05, 5.002506077289581e-05, 5.68293035030365e-05, 6.363354623317719e-05, 7.043778896331787e-05, 7.724203169345856e-05, 8.404627442359924e-05, 9.085051715373993e-05, 9.765475988388062e-05, 0.0001044590026140213, 0.00011126324534416199, 0.00011806748807430267, 0.00012487173080444336, 0.00013167597353458405, 0.00013848021626472473, 0.00014528445899486542, 0.0001520887017250061, 0.0001588929444551468, 0.00016569718718528748, 0.00017250142991542816, 0.00017930567264556885, 0.00018610991537570953, 0.00019291415810585022, 0.0001997184008359909, 0.0002065226435661316, 0.00021332688629627228, 0.00022013112902641296, 0.00022693537175655365, 0.00023373961448669434, 0.00024054385721683502, 0.0002473480999469757, 0.0002541523426771164, 0.0002609565854072571, 0.00026776082813739777, 0.00027456507086753845, 0.00028136931359767914, 0.0002881735563278198, 0.0002949777990579605, 0.0003017820417881012, 0.0003085862845182419, 0.00031539052724838257, 0.00032219476997852325, 0.00032899901270866394, 0.0003358032554388046, 0.0003426074981689453]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 17.0, 17.0, 42.0, 48.0, 86.0, 96.0, 223.0, 318.0, 632.0, 1130.0, 2466.0, 6266.0, 19539.0, 81246.0, 387271.0, 423959.0, 91758.0, 21123.0, 6722.0, 2758.0, 1289.0, 612.0, 379.0, 198.0, 136.0, 64.0, 59.0, 30.0, 23.0, 12.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.5995330810546875, -0.576507568359375, -0.5534820556640625, -0.53045654296875, -0.5074310302734375, -0.484405517578125, -0.4613800048828125, -0.4383544921875, -0.4153289794921875, -0.392303466796875, -0.3692779541015625, -0.34625244140625, -0.3232269287109375, -0.300201416015625, -0.2771759033203125, -0.254150390625, -0.2311248779296875, -0.208099365234375, -0.1850738525390625, -0.16204833984375, -0.1390228271484375, -0.115997314453125, -0.0929718017578125, -0.0699462890625, -0.0469207763671875, -0.023895263671875, -0.0008697509765625, 0.02215576171875, 0.0451812744140625, 0.068206787109375, 0.0912322998046875, 0.1142578125, 0.1372833251953125, 0.160308837890625, 0.1833343505859375, 0.20635986328125, 0.2293853759765625, 0.252410888671875, 0.2754364013671875, 0.2984619140625, 0.3214874267578125, 0.344512939453125, 0.3675384521484375, 0.39056396484375, 0.4135894775390625, 0.436614990234375, 0.4596405029296875, 0.482666015625, 0.5056915283203125, 0.528717041015625, 0.5517425537109375, 0.57476806640625, 0.5977935791015625, 0.620819091796875, 0.6438446044921875, 0.6668701171875, 0.6898956298828125, 0.712921142578125, 0.7359466552734375, 0.75897216796875, 0.7819976806640625, 0.805023193359375, 0.8280487060546875, 0.85107421875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 5.0, 7.0, 11.0, 11.0, 17.0, 16.0, 30.0, 44.0, 57.0, 77.0, 105.0, 131.0, 122.0, 107.0, 80.0, 42.0, 32.0, 43.0, 22.0, 8.0, 10.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.090087890625, -1.05224609375, -1.014404296875, -0.9765625, -0.938720703125, -0.90087890625, -0.863037109375, -0.8251953125, -0.787353515625, -0.74951171875, -0.711669921875, -0.673828125, -0.635986328125, -0.59814453125, -0.560302734375, -0.5224609375, -0.484619140625, -0.44677734375, -0.408935546875, -0.37109375, -0.333251953125, -0.29541015625, -0.257568359375, -0.2197265625, -0.181884765625, -0.14404296875, -0.106201171875, -0.068359375, -0.030517578125, 0.00732421875, 0.045166015625, 0.0830078125, 0.120849609375, 0.15869140625, 0.196533203125, 0.234375, 0.272216796875, 0.31005859375, 0.347900390625, 0.3857421875, 0.423583984375, 0.46142578125, 0.499267578125, 0.537109375, 0.574951171875, 0.61279296875, 0.650634765625, 0.6884765625, 0.726318359375, 0.76416015625, 0.802001953125, 0.83984375, 0.877685546875, 0.91552734375, 0.953369140625, 0.9912109375, 1.029052734375, 1.06689453125, 1.104736328125, 1.142578125, 1.180419921875, 1.21826171875, 1.256103515625, 1.2939453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 14.0, 17.0, 21.0, 55.0, 72.0, 110.0, 151.0, 157.0, 162.0, 97.0, 59.0, 42.0, 16.0, 17.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.332056999206543, -7.817634582519531, -7.3032121658325195, -6.788789749145508, -6.274367332458496, -5.759944915771484, -5.245522499084473, -4.731100082397461, -4.216677665710449, -3.7022552490234375, -3.187832832336426, -2.673410415649414, -2.1589879989624023, -1.6445655822753906, -1.130143165588379, -0.6157207489013672, -0.10129833221435547, 0.41312408447265625, 0.927546501159668, 1.4419689178466797, 1.9563913345336914, 2.470813751220703, 2.985236167907715, 3.4996585845947266, 4.014081001281738, 4.52850341796875, 5.042925834655762, 5.557348251342773, 6.071770668029785, 6.586193084716797, 7.100615501403809, 7.61503791809082, 8.129459381103516, 8.643881797790527, 9.158304214477539, 9.67272663116455, 10.187149047851562, 10.701571464538574, 11.215993881225586, 11.730416297912598, 12.24483871459961, 12.759261131286621, 13.273683547973633, 13.788105964660645, 14.302528381347656, 14.816950798034668, 15.33137321472168, 15.845795631408691, 16.360218048095703, 16.87464141845703, 17.389062881469727, 17.903484344482422, 18.41790771484375, 18.932331085205078, 19.446752548217773, 19.96117401123047, 20.475597381591797, 20.990020751953125, 21.50444221496582, 22.018863677978516, 22.533287048339844, 23.047710418701172, 23.562131881713867, 24.076553344726562, 24.59097671508789]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 7.0, 10.0, 17.0, 17.0, 24.0, 31.0, 33.0, 43.0, 38.0, 51.0, 39.0, 52.0, 42.0, 39.0, 66.0, 64.0, 55.0, 52.0, 52.0, 35.0, 42.0, 30.0, 23.0, 25.0, 22.0, 14.0, 21.0, 13.0, 11.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.562973022460938, -11.183988571166992, -10.805004119873047, -10.426019668579102, -10.047036170959473, -9.668051719665527, -9.289067268371582, -8.910082817077637, -8.531098365783691, -8.152113914489746, -7.773129940032959, -7.394145488739014, -7.015161037445068, -6.636177062988281, -6.257192611694336, -5.878208160400391, -5.4992241859436035, -5.120239734649658, -4.741255760192871, -4.362271308898926, -3.9832868576049805, -3.6043026447296143, -3.225318431854248, -2.8463339805603027, -2.4673497676849365, -2.0883655548095703, -1.709381103515625, -1.3303968906402588, -0.951412558555603, -0.5724282264709473, -0.19344401359558105, 0.18554043769836426, 0.5645246505737305, 0.9435089826583862, 1.322493314743042, 1.7014775276184082, 2.0804619789123535, 2.4594461917877197, 2.838430404663086, 3.2174148559570312, 3.5963990688323975, 3.9753832817077637, 4.354367733001709, 4.733351707458496, 5.112336158752441, 5.491320610046387, 5.870305061340332, 6.249289512634277, 6.6282734870910645, 7.00725793838501, 7.386241912841797, 7.765226364135742, 8.144210815429688, 8.523195266723633, 8.902179718017578, 9.281164169311523, 9.660147666931152, 10.039132118225098, 10.418116569519043, 10.797100067138672, 11.176084518432617, 11.555068969726562, 11.934053421020508, 12.313037872314453, 12.692022323608398]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 6.0, 12.0, 8.0, 24.0, 29.0, 56.0, 74.0, 150.0, 296.0, 618.0, 1636.0, 6240.0, 51202.0, 4096515.0, 30251.0, 4669.0, 1367.0, 532.0, 236.0, 134.0, 69.0, 41.0, 23.0, 16.0, 9.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.5234375, -4.37939453125, -4.2353515625, -4.09130859375, -3.947265625, -3.80322265625, -3.6591796875, -3.51513671875, -3.37109375, -3.22705078125, -3.0830078125, -2.93896484375, -2.794921875, -2.65087890625, -2.5068359375, -2.36279296875, -2.21875, -2.07470703125, -1.9306640625, -1.78662109375, -1.642578125, -1.49853515625, -1.3544921875, -1.21044921875, -1.06640625, -0.92236328125, -0.7783203125, -0.63427734375, -0.490234375, -0.34619140625, -0.2021484375, -0.05810546875, 0.0859375, 0.22998046875, 0.3740234375, 0.51806640625, 0.662109375, 0.80615234375, 0.9501953125, 1.09423828125, 1.23828125, 1.38232421875, 1.5263671875, 1.67041015625, 1.814453125, 1.95849609375, 2.1025390625, 2.24658203125, 2.390625, 2.53466796875, 2.6787109375, 2.82275390625, 2.966796875, 3.11083984375, 3.2548828125, 3.39892578125, 3.54296875, 3.68701171875, 3.8310546875, 3.97509765625, 4.119140625, 4.26318359375, 4.4072265625, 4.55126953125, 4.6953125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 20.0, 20.0, 18.0, 48.0, 60.0, 48.0, 84.0, 84.0, 100.0, 95.0, 91.0, 70.0, 68.0, 35.0, 51.0, 31.0, 17.0, 11.0, 12.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90771484375, -0.8783721923828125, -0.849029541015625, -0.8196868896484375, -0.79034423828125, -0.7610015869140625, -0.731658935546875, -0.7023162841796875, -0.6729736328125, -0.6436309814453125, -0.614288330078125, -0.5849456787109375, -0.55560302734375, -0.5262603759765625, -0.496917724609375, -0.4675750732421875, -0.438232421875, -0.4088897705078125, -0.379547119140625, -0.3502044677734375, -0.32086181640625, -0.2915191650390625, -0.262176513671875, -0.2328338623046875, -0.2034912109375, -0.1741485595703125, -0.144805908203125, -0.1154632568359375, -0.08612060546875, -0.0567779541015625, -0.027435302734375, 0.0019073486328125, 0.03125, 0.0605926513671875, 0.089935302734375, 0.1192779541015625, 0.14862060546875, 0.1779632568359375, 0.207305908203125, 0.2366485595703125, 0.2659912109375, 0.2953338623046875, 0.324676513671875, 0.3540191650390625, 0.38336181640625, 0.4127044677734375, 0.442047119140625, 0.4713897705078125, 0.500732421875, 0.5300750732421875, 0.559417724609375, 0.5887603759765625, 0.61810302734375, 0.6474456787109375, 0.676788330078125, 0.7061309814453125, 0.7354736328125, 0.7648162841796875, 0.794158935546875, 0.8235015869140625, 0.85284423828125, 0.8821868896484375, 0.911529541015625, 0.9408721923828125, 0.97021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 17.0, 12.0, 22.0, 25.0, 25.0, 38.0, 54.0, 78.0, 76.0, 108.0, 146.0, 256.0, 379.0, 762.0, 1671.0, 4634.0, 22595.0, 3870615.0, 271619.0, 14341.0, 3618.0, 1305.0, 626.0, 353.0, 248.0, 168.0, 122.0, 86.0, 53.0, 48.0, 30.0, 27.0, 29.0, 17.0, 12.0, 7.0, 10.0, 13.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.953125, -3.82513427734375, -3.6971435546875, -3.56915283203125, -3.441162109375, -3.31317138671875, -3.1851806640625, -3.05718994140625, -2.92919921875, -2.80120849609375, -2.6732177734375, -2.54522705078125, -2.417236328125, -2.28924560546875, -2.1612548828125, -2.03326416015625, -1.9052734375, -1.77728271484375, -1.6492919921875, -1.52130126953125, -1.393310546875, -1.26531982421875, -1.1373291015625, -1.00933837890625, -0.88134765625, -0.75335693359375, -0.6253662109375, -0.49737548828125, -0.369384765625, -0.24139404296875, -0.1134033203125, 0.01458740234375, 0.142578125, 0.27056884765625, 0.3985595703125, 0.52655029296875, 0.654541015625, 0.78253173828125, 0.9105224609375, 1.03851318359375, 1.16650390625, 1.29449462890625, 1.4224853515625, 1.55047607421875, 1.678466796875, 1.80645751953125, 1.9344482421875, 2.06243896484375, 2.1904296875, 2.31842041015625, 2.4464111328125, 2.57440185546875, 2.702392578125, 2.83038330078125, 2.9583740234375, 3.08636474609375, 3.21435546875, 3.34234619140625, 3.4703369140625, 3.59832763671875, 3.726318359375, 3.85430908203125, 3.9822998046875, 4.11029052734375, 4.23828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 4.0, 6.0, 13.0, 26.0, 106.0, 3401.0, 426.0, 55.0, 19.0, 10.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9326171875, -0.891876220703125, -0.85113525390625, -0.810394287109375, -0.7696533203125, -0.728912353515625, -0.68817138671875, -0.647430419921875, -0.606689453125, -0.565948486328125, -0.52520751953125, -0.484466552734375, -0.4437255859375, -0.402984619140625, -0.36224365234375, -0.321502685546875, -0.28076171875, -0.240020751953125, -0.19927978515625, -0.158538818359375, -0.1177978515625, -0.077056884765625, -0.03631591796875, 0.004425048828125, 0.045166015625, 0.085906982421875, 0.12664794921875, 0.167388916015625, 0.2081298828125, 0.248870849609375, 0.28961181640625, 0.330352783203125, 0.37109375, 0.411834716796875, 0.45257568359375, 0.493316650390625, 0.5340576171875, 0.574798583984375, 0.61553955078125, 0.656280517578125, 0.697021484375, 0.737762451171875, 0.77850341796875, 0.819244384765625, 0.8599853515625, 0.900726318359375, 0.94146728515625, 0.982208251953125, 1.02294921875, 1.063690185546875, 1.10443115234375, 1.145172119140625, 1.1859130859375, 1.226654052734375, 1.26739501953125, 1.308135986328125, 1.348876953125, 1.389617919921875, 1.43035888671875, 1.471099853515625, 1.5118408203125, 1.552581787109375, 1.59332275390625, 1.634063720703125, 1.6748046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 42.0, 72.0, 217.0, 314.0, 182.0, 94.0, 44.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0910727977752686, -2.906198263168335, -2.7213237285614014, -2.5364491939544678, -2.351574659347534, -2.1667001247406006, -1.9818254709243774, -1.7969509363174438, -1.6120764017105103, -1.4272018671035767, -1.242327332496643, -1.05745267868042, -0.8725782036781311, -0.6877036690711975, -0.5028290748596191, -0.31795454025268555, -0.13308000564575195, 0.051794543862342834, 0.23666909337043762, 0.4215436577796936, 0.6064181923866272, 0.7912927269935608, 0.9761673212051392, 1.1610418558120728, 1.3459163904190063, 1.53079092502594, 1.7156654596328735, 1.9005401134490967, 2.0854146480560303, 2.270289182662964, 2.4551637172698975, 2.640038251876831, 2.8249125480651855, 3.009787082672119, 3.1946616172790527, 3.3795361518859863, 3.56441068649292, 3.7492852210998535, 3.934159755706787, 4.119034290313721, 4.303908824920654, 4.488783359527588, 4.6736578941345215, 4.858532428741455, 5.043406963348389, 5.228281497955322, 5.413156032562256, 5.5980305671691895, 5.782905578613281, 5.967780113220215, 6.152654647827148, 6.337529182434082, 6.522403717041016, 6.707278251647949, 6.892152786254883, 7.077027320861816, 7.26190185546875, 7.446776390075684, 7.631650924682617, 7.816525459289551, 8.001399993896484, 8.186274528503418, 8.371149063110352, 8.556023597717285, 8.740898132324219]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 5.0, 5.0, 21.0, 16.0, 17.0, 20.0, 27.0, 29.0, 28.0, 35.0, 31.0, 49.0, 44.0, 43.0, 56.0, 55.0, 55.0, 50.0, 43.0, 49.0, 46.0, 38.0, 36.0, 40.0, 25.0, 24.0, 16.0, 21.0, 22.0, 8.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1871438026428223, -2.120305061340332, -2.053466558456421, -1.9866278171539307, -1.91978919506073, -1.8529505729675293, -1.7861119508743286, -1.719273328781128, -1.6524345874786377, -1.585595965385437, -1.5187573432922363, -1.451918601989746, -1.3850799798965454, -1.3182413578033447, -1.251402735710144, -1.1845641136169434, -1.1177254915237427, -1.050886869430542, -0.9840481877326965, -0.9172095656394958, -0.8503708839416504, -0.7835322618484497, -0.716693639755249, -0.6498550176620483, -0.5830163359642029, -0.5161777138710022, -0.44933903217315674, -0.38250041007995605, -0.315661758184433, -0.2488231062889099, -0.18198448419570923, -0.11514583230018616, -0.048307180404663086, 0.01853146404027939, 0.08537010848522186, 0.15220874547958374, 0.2190473973751068, 0.2858860492706299, 0.35272467136383057, 0.41956332325935364, 0.4864019751548767, 0.5532405972480774, 0.6200792789459229, 0.6869179010391235, 0.7537565231323242, 0.8205952048301697, 0.8874338269233704, 0.9542725086212158, 1.0211111307144165, 1.0879497528076172, 1.1547883749008179, 1.2216269969940186, 1.2884657382965088, 1.3553043603897095, 1.4221429824829102, 1.4889816045761108, 1.5558202266693115, 1.6226588487625122, 1.689497470855713, 1.7563362121582031, 1.8231748342514038, 1.8900134563446045, 1.9568520784378052, 2.023690700531006, 2.090529441833496]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 9.0, 10.0, 30.0, 20.0, 48.0, 107.0, 164.0, 270.0, 511.0, 1015.0, 2281.0, 5734.0, 17249.0, 60332.0, 224394.0, 452267.0, 204294.0, 54223.0, 15931.0, 5364.0, 2218.0, 993.0, 439.0, 281.0, 149.0, 72.0, 64.0, 40.0, 20.0, 10.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.205078125, -2.1326904296875, -2.060302734375, -1.9879150390625, -1.91552734375, -1.8431396484375, -1.770751953125, -1.6983642578125, -1.6259765625, -1.5535888671875, -1.481201171875, -1.4088134765625, -1.33642578125, -1.2640380859375, -1.191650390625, -1.1192626953125, -1.046875, -0.9744873046875, -0.902099609375, -0.8297119140625, -0.75732421875, -0.6849365234375, -0.612548828125, -0.5401611328125, -0.4677734375, -0.3953857421875, -0.322998046875, -0.2506103515625, -0.17822265625, -0.1058349609375, -0.033447265625, 0.0389404296875, 0.111328125, 0.1837158203125, 0.256103515625, 0.3284912109375, 0.40087890625, 0.4732666015625, 0.545654296875, 0.6180419921875, 0.6904296875, 0.7628173828125, 0.835205078125, 0.9075927734375, 0.97998046875, 1.0523681640625, 1.124755859375, 1.1971435546875, 1.26953125, 1.3419189453125, 1.414306640625, 1.4866943359375, 1.55908203125, 1.6314697265625, 1.703857421875, 1.7762451171875, 1.8486328125, 1.9210205078125, 1.993408203125, 2.0657958984375, 2.13818359375, 2.2105712890625, 2.282958984375, 2.3553466796875, 2.427734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 9.0, 14.0, 15.0, 11.0, 28.0, 27.0, 46.0, 34.0, 47.0, 53.0, 68.0, 66.0, 68.0, 72.0, 76.0, 59.0, 44.0, 52.0, 49.0, 38.0, 24.0, 24.0, 24.0, 17.0, 10.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.93896484375, -0.909515380859375, -0.88006591796875, -0.850616455078125, -0.8211669921875, -0.791717529296875, -0.76226806640625, -0.732818603515625, -0.703369140625, -0.673919677734375, -0.64447021484375, -0.615020751953125, -0.5855712890625, -0.556121826171875, -0.52667236328125, -0.497222900390625, -0.4677734375, -0.438323974609375, -0.40887451171875, -0.379425048828125, -0.3499755859375, -0.320526123046875, -0.29107666015625, -0.261627197265625, -0.232177734375, -0.202728271484375, -0.17327880859375, -0.143829345703125, -0.1143798828125, -0.084930419921875, -0.05548095703125, -0.026031494140625, 0.00341796875, 0.032867431640625, 0.06231689453125, 0.091766357421875, 0.1212158203125, 0.150665283203125, 0.18011474609375, 0.209564208984375, 0.239013671875, 0.268463134765625, 0.29791259765625, 0.327362060546875, 0.3568115234375, 0.386260986328125, 0.41571044921875, 0.445159912109375, 0.474609375, 0.504058837890625, 0.53350830078125, 0.562957763671875, 0.5924072265625, 0.621856689453125, 0.65130615234375, 0.680755615234375, 0.710205078125, 0.739654541015625, 0.76910400390625, 0.798553466796875, 0.8280029296875, 0.857452392578125, 0.88690185546875, 0.916351318359375, 0.94580078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 13.0, 19.0, 21.0, 39.0, 52.0, 57.0, 103.0, 143.0, 265.0, 527.0, 1016.0, 2444.0, 6116.0, 17876.0, 70046.0, 373663.0, 457119.0, 85728.0, 21067.0, 6977.0, 2739.0, 1221.0, 537.0, 269.0, 148.0, 116.0, 65.0, 46.0, 28.0, 27.0, 25.0, 12.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80047607421875, -2.7103271484375, -2.62017822265625, -2.530029296875, -2.43988037109375, -2.3497314453125, -2.25958251953125, -2.16943359375, -2.07928466796875, -1.9891357421875, -1.89898681640625, -1.808837890625, -1.71868896484375, -1.6285400390625, -1.53839111328125, -1.4482421875, -1.35809326171875, -1.2679443359375, -1.17779541015625, -1.087646484375, -0.99749755859375, -0.9073486328125, -0.81719970703125, -0.72705078125, -0.63690185546875, -0.5467529296875, -0.45660400390625, -0.366455078125, -0.27630615234375, -0.1861572265625, -0.09600830078125, -0.005859375, 0.08428955078125, 0.1744384765625, 0.26458740234375, 0.354736328125, 0.44488525390625, 0.5350341796875, 0.62518310546875, 0.71533203125, 0.80548095703125, 0.8956298828125, 0.98577880859375, 1.075927734375, 1.16607666015625, 1.2562255859375, 1.34637451171875, 1.4365234375, 1.52667236328125, 1.6168212890625, 1.70697021484375, 1.797119140625, 1.88726806640625, 1.9774169921875, 2.06756591796875, 2.15771484375, 2.24786376953125, 2.3380126953125, 2.42816162109375, 2.518310546875, 2.60845947265625, 2.6986083984375, 2.78875732421875, 2.87890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 5.0, 5.0, 13.0, 12.0, 13.0, 17.0, 18.0, 23.0, 27.0, 36.0, 29.0, 49.0, 33.0, 51.0, 54.0, 51.0, 48.0, 54.0, 51.0, 40.0, 53.0, 50.0, 33.0, 41.0, 36.0, 28.0, 23.0, 14.0, 13.0, 13.0, 11.0, 4.0, 5.0, 6.0, 8.0, 4.0, 1.0, 6.0, 3.0, 0.0, 3.0, 5.0], "bins": [-4.78515625, -4.6619873046875, -4.538818359375, -4.4156494140625, -4.29248046875, -4.1693115234375, -4.046142578125, -3.9229736328125, -3.7998046875, -3.6766357421875, -3.553466796875, -3.4302978515625, -3.30712890625, -3.1839599609375, -3.060791015625, -2.9376220703125, -2.814453125, -2.6912841796875, -2.568115234375, -2.4449462890625, -2.32177734375, -2.1986083984375, -2.075439453125, -1.9522705078125, -1.8291015625, -1.7059326171875, -1.582763671875, -1.4595947265625, -1.33642578125, -1.2132568359375, -1.090087890625, -0.9669189453125, -0.84375, -0.7205810546875, -0.597412109375, -0.4742431640625, -0.35107421875, -0.2279052734375, -0.104736328125, 0.0184326171875, 0.1416015625, 0.2647705078125, 0.387939453125, 0.5111083984375, 0.63427734375, 0.7574462890625, 0.880615234375, 1.0037841796875, 1.126953125, 1.2501220703125, 1.373291015625, 1.4964599609375, 1.61962890625, 1.7427978515625, 1.865966796875, 1.9891357421875, 2.1123046875, 2.2354736328125, 2.358642578125, 2.4818115234375, 2.60498046875, 2.7281494140625, 2.851318359375, 2.9744873046875, 3.09765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 12.0, 16.0, 19.0, 64.0, 124.0, 308.0, 1087.0, 7519.0, 1012012.0, 24793.0, 1871.0, 424.0, 161.0, 62.0, 31.0, 17.0, 15.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8203125, -7.6126708984375, -7.405029296875, -7.1973876953125, -6.98974609375, -6.7821044921875, -6.574462890625, -6.3668212890625, -6.1591796875, -5.9515380859375, -5.743896484375, -5.5362548828125, -5.32861328125, -5.1209716796875, -4.913330078125, -4.7056884765625, -4.498046875, -4.2904052734375, -4.082763671875, -3.8751220703125, -3.66748046875, -3.4598388671875, -3.252197265625, -3.0445556640625, -2.8369140625, -2.6292724609375, -2.421630859375, -2.2139892578125, -2.00634765625, -1.7987060546875, -1.591064453125, -1.3834228515625, -1.17578125, -0.9681396484375, -0.760498046875, -0.5528564453125, -0.34521484375, -0.1375732421875, 0.070068359375, 0.2777099609375, 0.4853515625, 0.6929931640625, 0.900634765625, 1.1082763671875, 1.31591796875, 1.5235595703125, 1.731201171875, 1.9388427734375, 2.146484375, 2.3541259765625, 2.561767578125, 2.7694091796875, 2.97705078125, 3.1846923828125, 3.392333984375, 3.5999755859375, 3.8076171875, 4.0152587890625, 4.222900390625, 4.4305419921875, 4.63818359375, 4.8458251953125, 5.053466796875, 5.2611083984375, 5.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 9.0, 4.0, 20.0, 27.0, 48.0, 88.0, 99.0, 151.0, 164.0, 136.0, 109.0, 53.0, 35.0, 16.0, 18.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028228759765625, -0.0002748984843492508, -0.0002675093710422516, -0.0002601202577352524, -0.0002527311444282532, -0.00024534203112125397, -0.00023795291781425476, -0.00023056380450725555, -0.00022317469120025635, -0.00021578557789325714, -0.00020839646458625793, -0.00020100735127925873, -0.00019361823797225952, -0.00018622912466526031, -0.0001788400113582611, -0.0001714508980512619, -0.0001640617847442627, -0.0001566726714372635, -0.00014928355813026428, -0.00014189444482326508, -0.00013450533151626587, -0.00012711621820926666, -0.00011972710490226746, -0.00011233799159526825, -0.00010494887828826904, -9.755976498126984e-05, -9.017065167427063e-05, -8.278153836727142e-05, -7.539242506027222e-05, -6.800331175327301e-05, -6.0614198446273804e-05, -5.32250851392746e-05, -4.583597183227539e-05, -3.8446858525276184e-05, -3.105774521827698e-05, -2.366863191127777e-05, -1.6279518604278564e-05, -8.890405297279358e-06, -1.5012919902801514e-06, 5.887821316719055e-06, 1.3276934623718262e-05, 2.0666047930717468e-05, 2.8055161237716675e-05, 3.544427454471588e-05, 4.283338785171509e-05, 5.0222501158714294e-05, 5.76116144657135e-05, 6.500072777271271e-05, 7.238984107971191e-05, 7.977895438671112e-05, 8.716806769371033e-05, 9.455718100070953e-05, 0.00010194629430770874, 0.00010933540761470795, 0.00011672452092170715, 0.00012411363422870636, 0.00013150274753570557, 0.00013889186084270477, 0.00014628097414970398, 0.00015367008745670319, 0.0001610592007637024, 0.0001684483140707016, 0.0001758374273777008, 0.0001832265406847, 0.00019061565399169922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 10.0, 15.0, 33.0, 61.0, 92.0, 195.0, 476.0, 1209.0, 4130.0, 47458.0, 949587.0, 39361.0, 3872.0, 1177.0, 478.0, 195.0, 106.0, 43.0, 18.0, 14.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.064453125, -2.9700927734375, -2.875732421875, -2.7813720703125, -2.68701171875, -2.5926513671875, -2.498291015625, -2.4039306640625, -2.3095703125, -2.2152099609375, -2.120849609375, -2.0264892578125, -1.93212890625, -1.8377685546875, -1.743408203125, -1.6490478515625, -1.5546875, -1.4603271484375, -1.365966796875, -1.2716064453125, -1.17724609375, -1.0828857421875, -0.988525390625, -0.8941650390625, -0.7998046875, -0.7054443359375, -0.611083984375, -0.5167236328125, -0.42236328125, -0.3280029296875, -0.233642578125, -0.1392822265625, -0.044921875, 0.0494384765625, 0.143798828125, 0.2381591796875, 0.33251953125, 0.4268798828125, 0.521240234375, 0.6156005859375, 0.7099609375, 0.8043212890625, 0.898681640625, 0.9930419921875, 1.08740234375, 1.1817626953125, 1.276123046875, 1.3704833984375, 1.46484375, 1.5592041015625, 1.653564453125, 1.7479248046875, 1.84228515625, 1.9366455078125, 2.031005859375, 2.1253662109375, 2.2197265625, 2.3140869140625, 2.408447265625, 2.5028076171875, 2.59716796875, 2.6915283203125, 2.785888671875, 2.8802490234375, 2.974609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 13.0, 11.0, 22.0, 62.0, 108.0, 220.0, 252.0, 143.0, 74.0, 35.0, 19.0, 9.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.513671875, -2.413848876953125, -2.31402587890625, -2.214202880859375, -2.1143798828125, -2.014556884765625, -1.91473388671875, -1.814910888671875, -1.715087890625, -1.615264892578125, -1.51544189453125, -1.415618896484375, -1.3157958984375, -1.215972900390625, -1.11614990234375, -1.016326904296875, -0.91650390625, -0.816680908203125, -0.71685791015625, -0.617034912109375, -0.5172119140625, -0.417388916015625, -0.31756591796875, -0.217742919921875, -0.117919921875, -0.018096923828125, 0.08172607421875, 0.181549072265625, 0.2813720703125, 0.381195068359375, 0.48101806640625, 0.580841064453125, 0.6806640625, 0.780487060546875, 0.88031005859375, 0.980133056640625, 1.0799560546875, 1.179779052734375, 1.27960205078125, 1.379425048828125, 1.479248046875, 1.579071044921875, 1.67889404296875, 1.778717041015625, 1.8785400390625, 1.978363037109375, 2.07818603515625, 2.178009033203125, 2.27783203125, 2.377655029296875, 2.47747802734375, 2.577301025390625, 2.6771240234375, 2.776947021484375, 2.87677001953125, 2.976593017578125, 3.076416015625, 3.176239013671875, 3.27606201171875, 3.375885009765625, 3.4757080078125, 3.575531005859375, 3.67535400390625, 3.775177001953125, 3.875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 17.0, 16.0, 32.0, 26.0, 44.0, 53.0, 51.0, 68.0, 95.0, 115.0, 91.0, 72.0, 54.0, 69.0, 51.0, 42.0, 16.0, 20.0, 22.0, 7.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.282142639160156, -16.755569458007812, -16.2289981842041, -15.702425003051758, -15.17585277557373, -14.649280548095703, -14.12270736694336, -13.596135139465332, -13.069562911987305, -12.542990684509277, -12.016417503356934, -11.489845275878906, -10.963273048400879, -10.436700820922852, -9.910127639770508, -9.38355541229248, -8.856982231140137, -8.33041000366211, -7.803837299346924, -7.277264595031738, -6.750692367553711, -6.224119663238525, -5.69754695892334, -5.1709747314453125, -4.644402027130127, -4.117829322814941, -3.591257095336914, -3.0646843910217285, -2.538111925125122, -2.0115394592285156, -1.48496675491333, -0.9583942890167236, -0.4318218231201172, 0.09475070238113403, 0.6213232278823853, 1.1478958129882812, 1.6744682788848877, 2.201040744781494, 2.7276134490966797, 3.254185914993286, 3.7807583808898926, 4.307331085205078, 4.8339033126831055, 5.360476016998291, 5.887048721313477, 6.413620948791504, 6.9401936531066895, 7.466766357421875, 7.993338584899902, 8.51991081237793, 9.046483993530273, 9.5730562210083, 10.099628448486328, 10.626201629638672, 11.1527738571167, 11.679346084594727, 12.20591926574707, 12.732491493225098, 13.259064674377441, 13.785636901855469, 14.312209129333496, 14.838781356811523, 15.365354537963867, 15.891926765441895, 16.418498992919922]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 10.0, 7.0, 10.0, 8.0, 12.0, 10.0, 20.0, 18.0, 31.0, 25.0, 36.0, 38.0, 44.0, 36.0, 49.0, 53.0, 44.0, 60.0, 35.0, 45.0, 37.0, 48.0, 33.0, 24.0, 33.0, 32.0, 30.0, 24.0, 21.0, 17.0, 21.0, 12.0, 12.0, 6.0, 7.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.726259231567383, -17.16609001159668, -16.605920791625977, -16.045751571655273, -15.485581398010254, -14.92541217803955, -14.365242004394531, -13.805072784423828, -13.244903564453125, -12.684734344482422, -12.124565124511719, -11.5643949508667, -11.004225730895996, -10.444056510925293, -9.883886337280273, -9.32371711730957, -8.763547897338867, -8.203378677368164, -7.643208980560303, -7.083039283752441, -6.522870063781738, -5.962700843811035, -5.402531147003174, -4.8423614501953125, -4.282192230224609, -3.722022771835327, -3.161853313446045, -2.6016838550567627, -2.0415143966674805, -1.4813449382781982, -0.921175479888916, -0.3610060214996338, 0.19916534423828125, 0.7593348026275635, 1.3195042610168457, 1.879673719406128, 2.43984317779541, 3.0000126361846924, 3.5601820945739746, 4.120351791381836, 4.680521011352539, 5.240690231323242, 5.8008599281311035, 6.361029624938965, 6.921198844909668, 7.481368064880371, 8.04153823852539, 8.601707458496094, 9.161876678466797, 9.7220458984375, 10.282215118408203, 10.842385292053223, 11.402554512023926, 11.962723731994629, 12.522893905639648, 13.083063125610352, 13.643232345581055, 14.203401565551758, 14.763570785522461, 15.32374095916748, 15.883910179138184, 16.444080352783203, 17.004249572753906, 17.56441879272461, 18.124588012695312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 7.0, 8.0, 21.0, 24.0, 53.0, 55.0, 83.0, 160.0, 178.0, 300.0, 524.0, 966.0, 2013.0, 5072.0, 16349.0, 111334.0, 4005365.0, 36108.0, 8989.0, 3228.0, 1409.0, 726.0, 404.0, 306.0, 191.0, 132.0, 70.0, 53.0, 44.0, 19.0, 20.0, 14.0, 16.0, 7.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076171875, -2.974517822265625, -2.87286376953125, -2.771209716796875, -2.6695556640625, -2.567901611328125, -2.46624755859375, -2.364593505859375, -2.262939453125, -2.161285400390625, -2.05963134765625, -1.957977294921875, -1.8563232421875, -1.754669189453125, -1.65301513671875, -1.551361083984375, -1.44970703125, -1.348052978515625, -1.24639892578125, -1.144744873046875, -1.0430908203125, -0.941436767578125, -0.83978271484375, -0.738128662109375, -0.636474609375, -0.534820556640625, -0.43316650390625, -0.331512451171875, -0.2298583984375, -0.128204345703125, -0.02655029296875, 0.075103759765625, 0.1767578125, 0.278411865234375, 0.38006591796875, 0.481719970703125, 0.5833740234375, 0.685028076171875, 0.78668212890625, 0.888336181640625, 0.989990234375, 1.091644287109375, 1.19329833984375, 1.294952392578125, 1.3966064453125, 1.498260498046875, 1.59991455078125, 1.701568603515625, 1.80322265625, 1.904876708984375, 2.00653076171875, 2.108184814453125, 2.2098388671875, 2.311492919921875, 2.41314697265625, 2.514801025390625, 2.616455078125, 2.718109130859375, 2.81976318359375, 2.921417236328125, 3.0230712890625, 3.124725341796875, 3.22637939453125, 3.328033447265625, 3.4296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 10.0, 13.0, 17.0, 18.0, 20.0, 32.0, 44.0, 51.0, 70.0, 62.0, 64.0, 64.0, 57.0, 78.0, 62.0, 51.0, 47.0, 52.0, 39.0, 35.0, 18.0, 18.0, 19.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9716796875, -0.939422607421875, -0.90716552734375, -0.874908447265625, -0.8426513671875, -0.810394287109375, -0.77813720703125, -0.745880126953125, -0.713623046875, -0.681365966796875, -0.64910888671875, -0.616851806640625, -0.5845947265625, -0.552337646484375, -0.52008056640625, -0.487823486328125, -0.45556640625, -0.423309326171875, -0.39105224609375, -0.358795166015625, -0.3265380859375, -0.294281005859375, -0.26202392578125, -0.229766845703125, -0.197509765625, -0.165252685546875, -0.13299560546875, -0.100738525390625, -0.0684814453125, -0.036224365234375, -0.00396728515625, 0.028289794921875, 0.060546875, 0.092803955078125, 0.12506103515625, 0.157318115234375, 0.1895751953125, 0.221832275390625, 0.25408935546875, 0.286346435546875, 0.318603515625, 0.350860595703125, 0.38311767578125, 0.415374755859375, 0.4476318359375, 0.479888916015625, 0.51214599609375, 0.544403076171875, 0.57666015625, 0.608917236328125, 0.64117431640625, 0.673431396484375, 0.7056884765625, 0.737945556640625, 0.77020263671875, 0.802459716796875, 0.834716796875, 0.866973876953125, 0.89923095703125, 0.931488037109375, 0.9637451171875, 0.996002197265625, 1.02825927734375, 1.060516357421875, 1.0927734375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 15.0, 10.0, 10.0, 19.0, 25.0, 33.0, 46.0, 75.0, 99.0, 139.0, 182.0, 253.0, 383.0, 682.0, 1146.0, 2166.0, 4221.0, 9329.0, 24707.0, 98071.0, 3856366.0, 144230.0, 30360.0, 10957.0, 4788.0, 2463.0, 1261.0, 769.0, 424.0, 319.0, 205.0, 149.0, 98.0, 79.0, 44.0, 31.0, 28.0, 20.0, 18.0, 17.0, 9.0, 2.0, 8.0, 4.0, 2.0, 8.0, 5.0, 1.0, 2.0], "bins": [-2.833984375, -2.754364013671875, -2.67474365234375, -2.595123291015625, -2.5155029296875, -2.435882568359375, -2.35626220703125, -2.276641845703125, -2.197021484375, -2.117401123046875, -2.03778076171875, -1.958160400390625, -1.8785400390625, -1.798919677734375, -1.71929931640625, -1.639678955078125, -1.56005859375, -1.480438232421875, -1.40081787109375, -1.321197509765625, -1.2415771484375, -1.161956787109375, -1.08233642578125, -1.002716064453125, -0.923095703125, -0.843475341796875, -0.76385498046875, -0.684234619140625, -0.6046142578125, -0.524993896484375, -0.44537353515625, -0.365753173828125, -0.2861328125, -0.206512451171875, -0.12689208984375, -0.047271728515625, 0.0323486328125, 0.111968994140625, 0.19158935546875, 0.271209716796875, 0.350830078125, 0.430450439453125, 0.51007080078125, 0.589691162109375, 0.6693115234375, 0.748931884765625, 0.82855224609375, 0.908172607421875, 0.98779296875, 1.067413330078125, 1.14703369140625, 1.226654052734375, 1.3062744140625, 1.385894775390625, 1.46551513671875, 1.545135498046875, 1.624755859375, 1.704376220703125, 1.78399658203125, 1.863616943359375, 1.9432373046875, 2.022857666015625, 2.10247802734375, 2.182098388671875, 2.26171875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 23.0, 45.0, 48.0, 156.0, 3257.0, 314.0, 84.0, 45.0, 28.0, 18.0, 7.0, 9.0, 8.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1884002685546875, -1.156097412109375, -1.1237945556640625, -1.09149169921875, -1.0591888427734375, -1.026885986328125, -0.9945831298828125, -0.9622802734375, -0.9299774169921875, -0.897674560546875, -0.8653717041015625, -0.83306884765625, -0.8007659912109375, -0.768463134765625, -0.7361602783203125, -0.703857421875, -0.6715545654296875, -0.639251708984375, -0.6069488525390625, -0.57464599609375, -0.5423431396484375, -0.510040283203125, -0.4777374267578125, -0.4454345703125, -0.4131317138671875, -0.380828857421875, -0.3485260009765625, -0.31622314453125, -0.2839202880859375, -0.251617431640625, -0.2193145751953125, -0.18701171875, -0.1547088623046875, -0.122406005859375, -0.0901031494140625, -0.05780029296875, -0.0254974365234375, 0.006805419921875, 0.0391082763671875, 0.0714111328125, 0.1037139892578125, 0.136016845703125, 0.1683197021484375, 0.20062255859375, 0.2329254150390625, 0.265228271484375, 0.2975311279296875, 0.329833984375, 0.3621368408203125, 0.394439697265625, 0.4267425537109375, 0.45904541015625, 0.4913482666015625, 0.523651123046875, 0.5559539794921875, 0.5882568359375, 0.6205596923828125, 0.652862548828125, 0.6851654052734375, 0.71746826171875, 0.7497711181640625, 0.782073974609375, 0.8143768310546875, 0.8466796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 7.0, 13.0, 21.0, 37.0, 53.0, 54.0, 78.0, 92.0, 111.0, 98.0, 114.0, 97.0, 73.0, 60.0, 42.0, 12.0, 20.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5895838737487793, -3.4941811561584473, -3.398778200149536, -3.303375482559204, -3.207972526550293, -3.112569808959961, -3.017167091369629, -2.9217641353607178, -2.8263611793518066, -2.7309584617614746, -2.6355555057525635, -2.5401527881622314, -2.4447498321533203, -2.3493471145629883, -2.2539443969726562, -2.158541440963745, -2.063138723373413, -1.9677358865737915, -1.87233304977417, -1.776930332183838, -1.6815273761749268, -1.5861246585845947, -1.4907218217849731, -1.3953189849853516, -1.29991614818573, -1.2045133113861084, -1.1091104745864868, -1.0137076377868652, -0.9183048605918884, -0.8229020237922668, -0.72749924659729, -0.6320964097976685, -0.5366935729980469, -0.4412907361984253, -0.3458879292011261, -0.2504851222038269, -0.15508228540420532, -0.05967944860458374, 0.035723328590393066, 0.13112616539001465, 0.22652900218963623, 0.3219318389892578, 0.417334645986557, 0.5127374529838562, 0.6081402897834778, 0.7035431265830994, 0.7989459037780762, 0.8943487405776978, 0.9897515773773193, 1.085154414176941, 1.1805572509765625, 1.2759599685668945, 1.3713629245758057, 1.4667656421661377, 1.5621684789657593, 1.6575713157653809, 1.7529741525650024, 1.848376989364624, 1.9437798261642456, 2.039182662963867, 2.134585380554199, 2.2299883365631104, 2.3253910541534424, 2.4207940101623535, 2.5161967277526855]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 6.0, 6.0, 11.0, 22.0, 14.0, 28.0, 26.0, 26.0, 23.0, 32.0, 40.0, 32.0, 32.0, 45.0, 43.0, 40.0, 50.0, 46.0, 56.0, 40.0, 34.0, 55.0, 51.0, 36.0, 35.0, 29.0, 18.0, 23.0, 17.0, 19.0, 9.0, 7.0, 10.0, 7.0, 12.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9960172176361084, -1.9374629259109497, -1.8789085149765015, -1.8203542232513428, -1.761799931526184, -1.7032456398010254, -1.6446912288665771, -1.5861369371414185, -1.5275826454162598, -1.469028353691101, -1.4104739427566528, -1.3519196510314941, -1.2933653593063354, -1.2348110675811768, -1.1762566566467285, -1.1177023649215698, -1.0591480731964111, -1.0005937814712524, -0.942039430141449, -0.8834850788116455, -0.8249307870864868, -0.7663764357566833, -0.7078220844268799, -0.6492677927017212, -0.590713381767273, -0.5321590304374695, -0.4736047387123108, -0.4150503873825073, -0.35649609565734863, -0.29794174432754517, -0.2393874228000641, -0.180833101272583, -0.12227880954742432, -0.06372448801994324, -0.005170159041881561, 0.053384169936180115, 0.1119384914636612, 0.17049282789230347, 0.22904714941978455, 0.2876014709472656, 0.3461557924747467, 0.4047101140022278, 0.46326443552970886, 0.5218187570571899, 0.5803731083869934, 0.6389274597167969, 0.6974817514419556, 0.7560360431671143, 0.8145903944969177, 0.8731447458267212, 0.9316990375518799, 0.9902533888816833, 1.0488077402114868, 1.1073620319366455, 1.1659163236618042, 1.224470615386963, 1.2830250263214111, 1.3415793180465698, 1.400133728981018, 1.4586880207061768, 1.5172423124313354, 1.5757966041564941, 1.6343510150909424, 1.692905306816101, 1.7514595985412598]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 9.0, 17.0, 25.0, 42.0, 62.0, 69.0, 117.0, 172.0, 282.0, 449.0, 777.0, 1381.0, 2470.0, 4807.0, 10066.0, 22641.0, 56024.0, 140962.0, 288561.0, 283734.0, 138478.0, 54614.0, 22130.0, 9854.0, 4856.0, 2541.0, 1359.0, 757.0, 455.0, 291.0, 175.0, 122.0, 92.0, 45.0, 46.0, 17.0, 14.0, 13.0, 2.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6358795166015625, -1.581329345703125, -1.5267791748046875, -1.47222900390625, -1.4176788330078125, -1.363128662109375, -1.3085784912109375, -1.2540283203125, -1.1994781494140625, -1.144927978515625, -1.0903778076171875, -1.03582763671875, -0.9812774658203125, -0.926727294921875, -0.8721771240234375, -0.817626953125, -0.7630767822265625, -0.708526611328125, -0.6539764404296875, -0.59942626953125, -0.5448760986328125, -0.490325927734375, -0.4357757568359375, -0.3812255859375, -0.3266754150390625, -0.272125244140625, -0.2175750732421875, -0.16302490234375, -0.1084747314453125, -0.053924560546875, 0.0006256103515625, 0.05517578125, 0.1097259521484375, 0.164276123046875, 0.2188262939453125, 0.27337646484375, 0.3279266357421875, 0.382476806640625, 0.4370269775390625, 0.4915771484375, 0.5461273193359375, 0.600677490234375, 0.6552276611328125, 0.70977783203125, 0.7643280029296875, 0.818878173828125, 0.8734283447265625, 0.927978515625, 0.9825286865234375, 1.037078857421875, 1.0916290283203125, 1.14617919921875, 1.2007293701171875, 1.255279541015625, 1.3098297119140625, 1.3643798828125, 1.4189300537109375, 1.473480224609375, 1.5280303955078125, 1.58258056640625, 1.6371307373046875, 1.691680908203125, 1.7462310791015625, 1.80078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 7.0, 4.0, 9.0, 8.0, 11.0, 14.0, 19.0, 28.0, 34.0, 37.0, 42.0, 50.0, 55.0, 47.0, 65.0, 65.0, 67.0, 54.0, 53.0, 49.0, 46.0, 41.0, 42.0, 24.0, 32.0, 22.0, 16.0, 11.0, 9.0, 13.0, 3.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.013671875, -0.9827423095703125, -0.951812744140625, -0.9208831787109375, -0.88995361328125, -0.8590240478515625, -0.828094482421875, -0.7971649169921875, -0.7662353515625, -0.7353057861328125, -0.704376220703125, -0.6734466552734375, -0.64251708984375, -0.6115875244140625, -0.580657958984375, -0.5497283935546875, -0.518798828125, -0.4878692626953125, -0.456939697265625, -0.4260101318359375, -0.39508056640625, -0.3641510009765625, -0.333221435546875, -0.3022918701171875, -0.2713623046875, -0.2404327392578125, -0.209503173828125, -0.1785736083984375, -0.14764404296875, -0.1167144775390625, -0.085784912109375, -0.0548553466796875, -0.02392578125, 0.0070037841796875, 0.037933349609375, 0.0688629150390625, 0.09979248046875, 0.1307220458984375, 0.161651611328125, 0.1925811767578125, 0.2235107421875, 0.2544403076171875, 0.285369873046875, 0.3162994384765625, 0.34722900390625, 0.3781585693359375, 0.409088134765625, 0.4400177001953125, 0.470947265625, 0.5018768310546875, 0.532806396484375, 0.5637359619140625, 0.59466552734375, 0.6255950927734375, 0.656524658203125, 0.6874542236328125, 0.7183837890625, 0.7493133544921875, 0.780242919921875, 0.8111724853515625, 0.84210205078125, 0.8730316162109375, 0.903961181640625, 0.9348907470703125, 0.9658203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 8.0, 14.0, 12.0, 18.0, 30.0, 44.0, 83.0, 136.0, 235.0, 446.0, 849.0, 2099.0, 5715.0, 21016.0, 114378.0, 597073.0, 252189.0, 39528.0, 9219.0, 2959.0, 1261.0, 565.0, 261.0, 135.0, 96.0, 46.0, 35.0, 22.0, 21.0, 18.0, 9.0, 10.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.89453125, -3.791229248046875, -3.68792724609375, -3.584625244140625, -3.4813232421875, -3.378021240234375, -3.27471923828125, -3.171417236328125, -3.068115234375, -2.964813232421875, -2.86151123046875, -2.758209228515625, -2.6549072265625, -2.551605224609375, -2.44830322265625, -2.345001220703125, -2.24169921875, -2.138397216796875, -2.03509521484375, -1.931793212890625, -1.8284912109375, -1.725189208984375, -1.62188720703125, -1.518585205078125, -1.415283203125, -1.311981201171875, -1.20867919921875, -1.105377197265625, -1.0020751953125, -0.898773193359375, -0.79547119140625, -0.692169189453125, -0.5888671875, -0.485565185546875, -0.38226318359375, -0.278961181640625, -0.1756591796875, -0.072357177734375, 0.03094482421875, 0.134246826171875, 0.237548828125, 0.340850830078125, 0.44415283203125, 0.547454833984375, 0.6507568359375, 0.754058837890625, 0.85736083984375, 0.960662841796875, 1.06396484375, 1.167266845703125, 1.27056884765625, 1.373870849609375, 1.4771728515625, 1.580474853515625, 1.68377685546875, 1.787078857421875, 1.890380859375, 1.993682861328125, 2.09698486328125, 2.200286865234375, 2.3035888671875, 2.406890869140625, 2.51019287109375, 2.613494873046875, 2.716796875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 9.0, 22.0, 28.0, 19.0, 33.0, 29.0, 39.0, 44.0, 64.0, 60.0, 56.0, 77.0, 72.0, 65.0, 68.0, 58.0, 50.0, 39.0, 34.0, 33.0, 27.0, 12.0, 16.0, 8.0, 10.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.61956787109375, -5.4500732421875, -5.28057861328125, -5.111083984375, -4.94158935546875, -4.7720947265625, -4.60260009765625, -4.43310546875, -4.26361083984375, -4.0941162109375, -3.92462158203125, -3.755126953125, -3.58563232421875, -3.4161376953125, -3.24664306640625, -3.0771484375, -2.90765380859375, -2.7381591796875, -2.56866455078125, -2.399169921875, -2.22967529296875, -2.0601806640625, -1.89068603515625, -1.72119140625, -1.55169677734375, -1.3822021484375, -1.21270751953125, -1.043212890625, -0.87371826171875, -0.7042236328125, -0.53472900390625, -0.365234375, -0.19573974609375, -0.0262451171875, 0.14324951171875, 0.312744140625, 0.48223876953125, 0.6517333984375, 0.82122802734375, 0.99072265625, 1.16021728515625, 1.3297119140625, 1.49920654296875, 1.668701171875, 1.83819580078125, 2.0076904296875, 2.17718505859375, 2.3466796875, 2.51617431640625, 2.6856689453125, 2.85516357421875, 3.024658203125, 3.19415283203125, 3.3636474609375, 3.53314208984375, 3.70263671875, 3.87213134765625, 4.0416259765625, 4.21112060546875, 4.380615234375, 4.55010986328125, 4.7196044921875, 4.88909912109375, 5.05859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 9.0, 16.0, 44.0, 49.0, 130.0, 250.0, 764.0, 2911.0, 26775.0, 885850.0, 123724.0, 6099.0, 1259.0, 376.0, 146.0, 70.0, 32.0, 24.0, 13.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.4852294921875, -3.378662109375, -3.2720947265625, -3.16552734375, -3.0589599609375, -2.952392578125, -2.8458251953125, -2.7392578125, -2.6326904296875, -2.526123046875, -2.4195556640625, -2.31298828125, -2.2064208984375, -2.099853515625, -1.9932861328125, -1.88671875, -1.7801513671875, -1.673583984375, -1.5670166015625, -1.46044921875, -1.3538818359375, -1.247314453125, -1.1407470703125, -1.0341796875, -0.9276123046875, -0.821044921875, -0.7144775390625, -0.60791015625, -0.5013427734375, -0.394775390625, -0.2882080078125, -0.181640625, -0.0750732421875, 0.031494140625, 0.1380615234375, 0.24462890625, 0.3511962890625, 0.457763671875, 0.5643310546875, 0.6708984375, 0.7774658203125, 0.884033203125, 0.9906005859375, 1.09716796875, 1.2037353515625, 1.310302734375, 1.4168701171875, 1.5234375, 1.6300048828125, 1.736572265625, 1.8431396484375, 1.94970703125, 2.0562744140625, 2.162841796875, 2.2694091796875, 2.3759765625, 2.4825439453125, 2.589111328125, 2.6956787109375, 2.80224609375, 2.9088134765625, 3.015380859375, 3.1219482421875, 3.228515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 14.0, 16.0, 20.0, 27.0, 34.0, 58.0, 77.0, 115.0, 125.0, 110.0, 112.0, 80.0, 59.0, 50.0, 34.0, 19.0, 11.0, 7.0, 7.0, 4.0, 7.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002899169921875, -0.0002820640802383423, -0.00027421116828918457, -0.00026635825634002686, -0.00025850534439086914, -0.0002506524324417114, -0.0002427995204925537, -0.000234946608543396, -0.00022709369659423828, -0.00021924078464508057, -0.00021138787269592285, -0.00020353496074676514, -0.00019568204879760742, -0.0001878291368484497, -0.000179976224899292, -0.00017212331295013428, -0.00016427040100097656, -0.00015641748905181885, -0.00014856457710266113, -0.00014071166515350342, -0.0001328587532043457, -0.000125005841255188, -0.00011715292930603027, -0.00010930001735687256, -0.00010144710540771484, -9.359419345855713e-05, -8.574128150939941e-05, -7.78883695602417e-05, -7.003545761108398e-05, -6.218254566192627e-05, -5.4329633712768555e-05, -4.647672176361084e-05, -3.8623809814453125e-05, -3.077089786529541e-05, -2.2917985916137695e-05, -1.506507396697998e-05, -7.212162017822266e-06, 6.407499313354492e-07, 8.493661880493164e-06, 1.634657382965088e-05, 2.4199485778808594e-05, 3.205239772796631e-05, 3.9905309677124023e-05, 4.775822162628174e-05, 5.561113357543945e-05, 6.346404552459717e-05, 7.131695747375488e-05, 7.91698694229126e-05, 8.702278137207031e-05, 9.487569332122803e-05, 0.00010272860527038574, 0.00011058151721954346, 0.00011843442916870117, 0.0001262873411178589, 0.0001341402530670166, 0.00014199316501617432, 0.00014984607696533203, 0.00015769898891448975, 0.00016555190086364746, 0.00017340481281280518, 0.0001812577247619629, 0.0001891106367111206, 0.00019696354866027832, 0.00020481646060943604, 0.00021266937255859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 9.0, 10.0, 14.0, 19.0, 39.0, 74.0, 129.0, 281.0, 670.0, 2086.0, 13223.0, 422643.0, 588630.0, 16800.0, 2527.0, 727.0, 293.0, 146.0, 84.0, 68.0, 23.0, 18.0, 18.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.388763427734375, -2.29705810546875, -2.205352783203125, -2.1136474609375, -2.021942138671875, -1.93023681640625, -1.838531494140625, -1.746826171875, -1.655120849609375, -1.56341552734375, -1.471710205078125, -1.3800048828125, -1.288299560546875, -1.19659423828125, -1.104888916015625, -1.01318359375, -0.921478271484375, -0.82977294921875, -0.738067626953125, -0.6463623046875, -0.554656982421875, -0.46295166015625, -0.371246337890625, -0.279541015625, -0.187835693359375, -0.09613037109375, -0.004425048828125, 0.0872802734375, 0.178985595703125, 0.27069091796875, 0.362396240234375, 0.4541015625, 0.545806884765625, 0.63751220703125, 0.729217529296875, 0.8209228515625, 0.912628173828125, 1.00433349609375, 1.096038818359375, 1.187744140625, 1.279449462890625, 1.37115478515625, 1.462860107421875, 1.5545654296875, 1.646270751953125, 1.73797607421875, 1.829681396484375, 1.92138671875, 2.013092041015625, 2.10479736328125, 2.196502685546875, 2.2882080078125, 2.379913330078125, 2.47161865234375, 2.563323974609375, 2.655029296875, 2.746734619140625, 2.83843994140625, 2.930145263671875, 3.0218505859375, 3.113555908203125, 3.20526123046875, 3.296966552734375, 3.388671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 11.0, 23.0, 66.0, 116.0, 190.0, 215.0, 177.0, 111.0, 39.0, 19.0, 12.0, 8.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.3228759765625, -2.196533203125, -2.0701904296875, -1.94384765625, -1.8175048828125, -1.691162109375, -1.5648193359375, -1.4384765625, -1.3121337890625, -1.185791015625, -1.0594482421875, -0.93310546875, -0.8067626953125, -0.680419921875, -0.5540771484375, -0.427734375, -0.3013916015625, -0.175048828125, -0.0487060546875, 0.07763671875, 0.2039794921875, 0.330322265625, 0.4566650390625, 0.5830078125, 0.7093505859375, 0.835693359375, 0.9620361328125, 1.08837890625, 1.2147216796875, 1.341064453125, 1.4674072265625, 1.59375, 1.7200927734375, 1.846435546875, 1.9727783203125, 2.09912109375, 2.2254638671875, 2.351806640625, 2.4781494140625, 2.6044921875, 2.7308349609375, 2.857177734375, 2.9835205078125, 3.10986328125, 3.2362060546875, 3.362548828125, 3.4888916015625, 3.615234375, 3.7415771484375, 3.867919921875, 3.9942626953125, 4.12060546875, 4.2469482421875, 4.373291015625, 4.4996337890625, 4.6259765625, 4.7523193359375, 4.878662109375, 5.0050048828125, 5.13134765625, 5.2576904296875, 5.384033203125, 5.5103759765625, 5.63671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 22.0, 144.0, 469.0, 318.0, 48.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.7418975830078, -159.59458923339844, -156.447265625, -153.29995727539062, -150.1526336669922, -147.0053253173828, -143.85800170898438, -140.710693359375, -137.56338500976562, -134.41607666015625, -131.2687530517578, -128.12144470214844, -124.97412872314453, -121.82681274414062, -118.67949676513672, -115.53218078613281, -112.3848648071289, -109.237548828125, -106.0902328491211, -102.94291687011719, -99.79560852050781, -96.6482925415039, -93.5009765625, -90.3536605834961, -87.20634460449219, -84.05902862548828, -80.91171264648438, -77.764404296875, -74.6170883178711, -71.46977233886719, -68.32245635986328, -65.17514038085938, -62.02782440185547, -58.88050842285156, -55.73319625854492, -52.585880279541016, -49.438568115234375, -46.29125213623047, -43.14393615722656, -39.996620178222656, -36.849308013916016, -33.70199203491211, -30.55467987060547, -27.407363891601562, -24.26004981994629, -21.112735748291016, -17.96541976928711, -14.818105697631836, -11.670791625976562, -8.523477554321289, -5.376162528991699, -2.2288475036621094, 0.9184665679931641, 4.0657806396484375, 7.213096618652344, 10.360410690307617, 13.50772476196289, 16.655038833618164, 19.802352905273438, 22.949668884277344, 26.096982955932617, 29.24429702758789, 32.3916130065918, 35.53892517089844, 38.686241149902344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 6.0, 16.0, 16.0, 14.0, 22.0, 19.0, 11.0, 22.0, 30.0, 33.0, 40.0, 45.0, 48.0, 58.0, 50.0, 48.0, 51.0, 53.0, 47.0, 52.0, 41.0, 38.0, 45.0, 24.0, 31.0, 21.0, 19.0, 19.0, 17.0, 10.0, 10.0, 5.0, 4.0, 4.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.56472396850586, -15.96933650970459, -15.373950004577637, -14.778562545776367, -14.183176040649414, -13.587788581848145, -12.992401123046875, -12.397014617919922, -11.801627159118652, -11.206239700317383, -10.61085319519043, -10.01546573638916, -9.42007827758789, -8.824691772460938, -8.229304313659668, -7.633917331695557, -7.038530349731445, -6.443143367767334, -5.847756385803223, -5.252368927001953, -4.656981945037842, -4.0615949630737305, -3.46620774269104, -2.8708205223083496, -2.2754335403442383, -1.6800464391708374, -1.0846593379974365, -0.48927223682403564, 0.10611486434936523, 0.7015018463134766, 1.296889066696167, 1.8922762870788574, 2.4876632690429688, 3.08305025100708, 3.6784374713897705, 4.273824691772461, 4.869211673736572, 5.464598655700684, 6.059986114501953, 6.6553730964660645, 7.250760078430176, 7.846147060394287, 8.441534042358398, 9.036921501159668, 9.632308959960938, 10.22769546508789, 10.82308292388916, 11.41847038269043, 12.013856887817383, 12.609244346618652, 13.204630851745605, 13.800018310546875, 14.395404815673828, 14.990792274475098, 15.586179733276367, 16.18156623840332, 16.776954650878906, 17.37234115600586, 17.967729568481445, 18.5631160736084, 19.15850257873535, 19.753890991210938, 20.34927749633789, 20.944664001464844, 21.540050506591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 11.0, 8.0, 23.0, 30.0, 40.0, 65.0, 73.0, 138.0, 194.0, 369.0, 730.0, 1420.0, 3324.0, 9262.0, 49579.0, 4093969.0, 23942.0, 6153.0, 2393.0, 1069.0, 602.0, 322.0, 194.0, 120.0, 71.0, 63.0, 31.0, 22.0, 9.0, 13.0, 9.0, 10.0, 2.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.61883544921875, -4.4759521484375, -4.33306884765625, -4.190185546875, -4.04730224609375, -3.9044189453125, -3.76153564453125, -3.61865234375, -3.47576904296875, -3.3328857421875, -3.19000244140625, -3.047119140625, -2.90423583984375, -2.7613525390625, -2.61846923828125, -2.4755859375, -2.33270263671875, -2.1898193359375, -2.04693603515625, -1.904052734375, -1.76116943359375, -1.6182861328125, -1.47540283203125, -1.33251953125, -1.18963623046875, -1.0467529296875, -0.90386962890625, -0.760986328125, -0.61810302734375, -0.4752197265625, -0.33233642578125, -0.189453125, -0.04656982421875, 0.0963134765625, 0.23919677734375, 0.382080078125, 0.52496337890625, 0.6678466796875, 0.81072998046875, 0.95361328125, 1.09649658203125, 1.2393798828125, 1.38226318359375, 1.525146484375, 1.66802978515625, 1.8109130859375, 1.95379638671875, 2.0966796875, 2.23956298828125, 2.3824462890625, 2.52532958984375, 2.668212890625, 2.81109619140625, 2.9539794921875, 3.09686279296875, 3.23974609375, 3.38262939453125, 3.5255126953125, 3.66839599609375, 3.811279296875, 3.95416259765625, 4.0970458984375, 4.23992919921875, 4.3828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 9.0, 20.0, 20.0, 27.0, 32.0, 39.0, 58.0, 53.0, 65.0, 61.0, 62.0, 83.0, 54.0, 68.0, 56.0, 40.0, 41.0, 39.0, 25.0, 35.0, 20.0, 18.0, 13.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9173049926757812, -0.8809967041015625, -0.8446884155273438, -0.808380126953125, -0.7720718383789062, -0.7357635498046875, -0.6994552612304688, -0.66314697265625, -0.6268386840820312, -0.5905303955078125, -0.5542221069335938, -0.517913818359375, -0.48160552978515625, -0.4452972412109375, -0.40898895263671875, -0.3726806640625, -0.33637237548828125, -0.3000640869140625, -0.26375579833984375, -0.227447509765625, -0.19113922119140625, -0.1548309326171875, -0.11852264404296875, -0.08221435546875, -0.04590606689453125, -0.0095977783203125, 0.02671051025390625, 0.063018798828125, 0.09932708740234375, 0.1356353759765625, 0.17194366455078125, 0.208251953125, 0.24456024169921875, 0.2808685302734375, 0.31717681884765625, 0.353485107421875, 0.38979339599609375, 0.4261016845703125, 0.46240997314453125, 0.49871826171875, 0.5350265502929688, 0.5713348388671875, 0.6076431274414062, 0.643951416015625, 0.6802597045898438, 0.7165679931640625, 0.7528762817382812, 0.7891845703125, 0.8254928588867188, 0.8618011474609375, 0.8981094360351562, 0.934417724609375, 0.9707260131835938, 1.0070343017578125, 1.0433425903320312, 1.07965087890625, 1.1159591674804688, 1.1522674560546875, 1.1885757446289062, 1.224884033203125, 1.2611923217773438, 1.2975006103515625, 1.3338088989257812, 1.3701171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 9.0, 13.0, 11.0, 11.0, 14.0, 34.0, 46.0, 52.0, 87.0, 118.0, 159.0, 269.0, 364.0, 598.0, 925.0, 1679.0, 3008.0, 6455.0, 16747.0, 84031.0, 4020331.0, 37538.0, 10906.0, 4760.0, 2367.0, 1349.0, 793.0, 513.0, 323.0, 216.0, 155.0, 106.0, 80.0, 46.0, 43.0, 27.0, 23.0, 16.0, 10.0, 14.0, 8.0, 4.0, 7.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89111328125, -3.7626953125, -3.63427734375, -3.505859375, -3.37744140625, -3.2490234375, -3.12060546875, -2.9921875, -2.86376953125, -2.7353515625, -2.60693359375, -2.478515625, -2.35009765625, -2.2216796875, -2.09326171875, -1.96484375, -1.83642578125, -1.7080078125, -1.57958984375, -1.451171875, -1.32275390625, -1.1943359375, -1.06591796875, -0.9375, -0.80908203125, -0.6806640625, -0.55224609375, -0.423828125, -0.29541015625, -0.1669921875, -0.03857421875, 0.08984375, 0.21826171875, 0.3466796875, 0.47509765625, 0.603515625, 0.73193359375, 0.8603515625, 0.98876953125, 1.1171875, 1.24560546875, 1.3740234375, 1.50244140625, 1.630859375, 1.75927734375, 1.8876953125, 2.01611328125, 2.14453125, 2.27294921875, 2.4013671875, 2.52978515625, 2.658203125, 2.78662109375, 2.9150390625, 3.04345703125, 3.171875, 3.30029296875, 3.4287109375, 3.55712890625, 3.685546875, 3.81396484375, 3.9423828125, 4.07080078125, 4.19921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 5.0, 11.0, 18.0, 19.0, 29.0, 52.0, 341.0, 3439.0, 56.0, 32.0, 22.0, 8.0, 7.0, 4.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9632034301757812, -0.9288482666015625, -0.8944931030273438, -0.860137939453125, -0.8257827758789062, -0.7914276123046875, -0.7570724487304688, -0.72271728515625, -0.6883621215820312, -0.6540069580078125, -0.6196517944335938, -0.585296630859375, -0.5509414672851562, -0.5165863037109375, -0.48223114013671875, -0.4478759765625, -0.41352081298828125, -0.3791656494140625, -0.34481048583984375, -0.310455322265625, -0.27610015869140625, -0.2417449951171875, -0.20738983154296875, -0.17303466796875, -0.13867950439453125, -0.1043243408203125, -0.06996917724609375, -0.035614013671875, -0.00125885009765625, 0.0330963134765625, 0.06745147705078125, 0.101806640625, 0.13616180419921875, 0.1705169677734375, 0.20487213134765625, 0.239227294921875, 0.27358245849609375, 0.3079376220703125, 0.34229278564453125, 0.37664794921875, 0.41100311279296875, 0.4453582763671875, 0.47971343994140625, 0.514068603515625, 0.5484237670898438, 0.5827789306640625, 0.6171340942382812, 0.6514892578125, 0.6858444213867188, 0.7201995849609375, 0.7545547485351562, 0.788909912109375, 0.8232650756835938, 0.8576202392578125, 0.8919754028320312, 0.92633056640625, 0.9606857299804688, 0.9950408935546875, 1.0293960571289062, 1.063751220703125, 1.0981063842773438, 1.1324615478515625, 1.1668167114257812, 1.201171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 21.0, 39.0, 91.0, 206.0, 239.0, 196.0, 105.0, 66.0, 24.0, 14.0, 7.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.39384126663208, -6.150108337402344, -5.906374931335449, -5.662641525268555, -5.418908596038818, -5.175175666809082, -4.9314422607421875, -4.687708854675293, -4.443975925445557, -4.20024299621582, -3.956509590148926, -3.7127764225006104, -3.469043254852295, -3.2253100872039795, -2.981576919555664, -2.7378437519073486, -2.494110584259033, -2.2503774166107178, -2.0066442489624023, -1.762911081314087, -1.5191779136657715, -1.275444746017456, -1.0317115783691406, -0.7879784107208252, -0.5442452430725098, -0.30051207542419434, -0.056778907775878906, 0.18695425987243652, 0.43068742752075195, 0.6744205951690674, 0.9181537628173828, 1.1618869304656982, 1.4056196212768555, 1.649352788925171, 1.8930859565734863, 2.1368191242218018, 2.380552291870117, 2.6242854595184326, 2.868018627166748, 3.1117517948150635, 3.355484962463379, 3.5992181301116943, 3.8429512977600098, 4.086684226989746, 4.330417633056641, 4.574151039123535, 4.8178839683532715, 5.061616897583008, 5.305350303649902, 5.549083709716797, 5.792816638946533, 6.0365495681762695, 6.280282974243164, 6.524016380310059, 6.767749309539795, 7.011482238769531, 7.255215644836426, 7.49894905090332, 7.742681980133057, 7.986414909362793, 8.230148315429688, 8.473881721496582, 8.717615127563477, 8.961347579956055, 9.20508098602295]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 11.0, 6.0, 5.0, 10.0, 15.0, 18.0, 16.0, 14.0, 21.0, 28.0, 28.0, 30.0, 36.0, 35.0, 44.0, 30.0, 46.0, 39.0, 59.0, 41.0, 43.0, 35.0, 48.0, 35.0, 42.0, 33.0, 32.0, 39.0, 31.0, 27.0, 20.0, 13.0, 11.0, 17.0, 7.0, 11.0, 10.0, 1.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.346281051635742, -2.2719013690948486, -2.197521686553955, -2.1231422424316406, -2.048762559890747, -1.9743828773498535, -1.9000033140182495, -1.8256237506866455, -1.751244068145752, -1.6768643856048584, -1.6024848222732544, -1.5281052589416504, -1.4537255764007568, -1.3793458938598633, -1.3049663305282593, -1.2305867671966553, -1.1562070846557617, -1.0818274021148682, -1.0074478387832642, -0.9330682158470154, -0.8586885929107666, -0.7843089699745178, -0.709929347038269, -0.6355497241020203, -0.5611701011657715, -0.4867904782295227, -0.4124108552932739, -0.33803123235702515, -0.26365160942077637, -0.1892719864845276, -0.11489236354827881, -0.04051274061203003, 0.03386688232421875, 0.10824650526046753, 0.1826261281967163, 0.2570057511329651, 0.33138537406921387, 0.40576499700546265, 0.4801446199417114, 0.5545242428779602, 0.628903865814209, 0.7032834887504578, 0.7776631116867065, 0.8520427346229553, 0.9264223575592041, 1.0008020401000977, 1.0751816034317017, 1.1495611667633057, 1.2239408493041992, 1.2983205318450928, 1.3727000951766968, 1.4470796585083008, 1.5214593410491943, 1.595839023590088, 1.670218586921692, 1.744598150253296, 1.8189778327941895, 1.893357515335083, 1.967737078666687, 2.042116641998291, 2.1164963245391846, 2.190876007080078, 2.2652554512023926, 2.339635133743286, 2.4140148162841797]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 12.0, 16.0, 22.0, 43.0, 64.0, 120.0, 191.0, 319.0, 535.0, 1020.0, 1889.0, 3768.0, 8104.0, 18634.0, 47976.0, 132487.0, 323040.0, 309211.0, 123371.0, 44908.0, 17735.0, 7438.0, 3576.0, 1767.0, 945.0, 581.0, 321.0, 175.0, 99.0, 61.0, 46.0, 26.0, 15.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9080047607421875, -1.844329833984375, -1.7806549072265625, -1.71697998046875, -1.6533050537109375, -1.589630126953125, -1.5259552001953125, -1.4622802734375, -1.3986053466796875, -1.334930419921875, -1.2712554931640625, -1.20758056640625, -1.1439056396484375, -1.080230712890625, -1.0165557861328125, -0.952880859375, -0.8892059326171875, -0.825531005859375, -0.7618560791015625, -0.69818115234375, -0.6345062255859375, -0.570831298828125, -0.5071563720703125, -0.4434814453125, -0.3798065185546875, -0.316131591796875, -0.2524566650390625, -0.18878173828125, -0.1251068115234375, -0.061431884765625, 0.0022430419921875, 0.06591796875, 0.1295928955078125, 0.193267822265625, 0.2569427490234375, 0.32061767578125, 0.3842926025390625, 0.447967529296875, 0.5116424560546875, 0.5753173828125, 0.6389923095703125, 0.702667236328125, 0.7663421630859375, 0.83001708984375, 0.8936920166015625, 0.957366943359375, 1.0210418701171875, 1.084716796875, 1.1483917236328125, 1.212066650390625, 1.2757415771484375, 1.33941650390625, 1.4030914306640625, 1.466766357421875, 1.5304412841796875, 1.5941162109375, 1.6577911376953125, 1.721466064453125, 1.7851409912109375, 1.84881591796875, 1.9124908447265625, 1.976165771484375, 2.0398406982421875, 2.103515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 7.0, 13.0, 11.0, 9.0, 14.0, 16.0, 38.0, 29.0, 28.0, 44.0, 40.0, 45.0, 46.0, 61.0, 49.0, 57.0, 54.0, 62.0, 46.0, 44.0, 31.0, 40.0, 40.0, 34.0, 20.0, 31.0, 21.0, 9.0, 8.0, 15.0, 4.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9202651977539062, -0.8869171142578125, -0.8535690307617188, -0.820220947265625, -0.7868728637695312, -0.7535247802734375, -0.7201766967773438, -0.68682861328125, -0.6534805297851562, -0.6201324462890625, -0.5867843627929688, -0.553436279296875, -0.5200881958007812, -0.4867401123046875, -0.45339202880859375, -0.4200439453125, -0.38669586181640625, -0.3533477783203125, -0.31999969482421875, -0.286651611328125, -0.25330352783203125, -0.2199554443359375, -0.18660736083984375, -0.15325927734375, -0.11991119384765625, -0.0865631103515625, -0.05321502685546875, -0.019866943359375, 0.01348114013671875, 0.0468292236328125, 0.08017730712890625, 0.113525390625, 0.14687347412109375, 0.1802215576171875, 0.21356964111328125, 0.246917724609375, 0.28026580810546875, 0.3136138916015625, 0.34696197509765625, 0.38031005859375, 0.41365814208984375, 0.4470062255859375, 0.48035430908203125, 0.513702392578125, 0.5470504760742188, 0.5803985595703125, 0.6137466430664062, 0.6470947265625, 0.6804428100585938, 0.7137908935546875, 0.7471389770507812, 0.780487060546875, 0.8138351440429688, 0.8471832275390625, 0.8805313110351562, 0.91387939453125, 0.9472274780273438, 0.9805755615234375, 1.0139236450195312, 1.047271728515625, 1.0806198120117188, 1.1139678955078125, 1.1473159790039062, 1.1806640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 7.0, 6.0, 7.0, 15.0, 15.0, 22.0, 38.0, 68.0, 107.0, 187.0, 388.0, 927.0, 2962.0, 13700.0, 104296.0, 716800.0, 181686.0, 21092.0, 4028.0, 1187.0, 456.0, 192.0, 140.0, 71.0, 51.0, 24.0, 18.0, 11.0, 8.0, 10.0, 5.0, 5.0, 5.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.89239501953125, -3.7652587890625, -3.63812255859375, -3.510986328125, -3.38385009765625, -3.2567138671875, -3.12957763671875, -3.00244140625, -2.87530517578125, -2.7481689453125, -2.62103271484375, -2.493896484375, -2.36676025390625, -2.2396240234375, -2.11248779296875, -1.9853515625, -1.85821533203125, -1.7310791015625, -1.60394287109375, -1.476806640625, -1.34967041015625, -1.2225341796875, -1.09539794921875, -0.96826171875, -0.84112548828125, -0.7139892578125, -0.58685302734375, -0.459716796875, -0.33258056640625, -0.2054443359375, -0.07830810546875, 0.048828125, 0.17596435546875, 0.3031005859375, 0.43023681640625, 0.557373046875, 0.68450927734375, 0.8116455078125, 0.93878173828125, 1.06591796875, 1.19305419921875, 1.3201904296875, 1.44732666015625, 1.574462890625, 1.70159912109375, 1.8287353515625, 1.95587158203125, 2.0830078125, 2.21014404296875, 2.3372802734375, 2.46441650390625, 2.591552734375, 2.71868896484375, 2.8458251953125, 2.97296142578125, 3.10009765625, 3.22723388671875, 3.3543701171875, 3.48150634765625, 3.608642578125, 3.73577880859375, 3.8629150390625, 3.99005126953125, 4.1171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 4.0, 11.0, 4.0, 13.0, 13.0, 12.0, 13.0, 20.0, 11.0, 25.0, 27.0, 20.0, 31.0, 34.0, 40.0, 37.0, 37.0, 51.0, 44.0, 39.0, 43.0, 36.0, 36.0, 37.0, 45.0, 40.0, 36.0, 30.0, 27.0, 23.0, 24.0, 15.0, 23.0, 19.0, 14.0, 13.0, 10.0, 7.0, 12.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.046875, -3.93145751953125, -3.8160400390625, -3.70062255859375, -3.585205078125, -3.46978759765625, -3.3543701171875, -3.23895263671875, -3.12353515625, -3.00811767578125, -2.8927001953125, -2.77728271484375, -2.661865234375, -2.54644775390625, -2.4310302734375, -2.31561279296875, -2.2001953125, -2.08477783203125, -1.9693603515625, -1.85394287109375, -1.738525390625, -1.62310791015625, -1.5076904296875, -1.39227294921875, -1.27685546875, -1.16143798828125, -1.0460205078125, -0.93060302734375, -0.815185546875, -0.69976806640625, -0.5843505859375, -0.46893310546875, -0.353515625, -0.23809814453125, -0.1226806640625, -0.00726318359375, 0.108154296875, 0.22357177734375, 0.3389892578125, 0.45440673828125, 0.56982421875, 0.68524169921875, 0.8006591796875, 0.91607666015625, 1.031494140625, 1.14691162109375, 1.2623291015625, 1.37774658203125, 1.4931640625, 1.60858154296875, 1.7239990234375, 1.83941650390625, 1.954833984375, 2.07025146484375, 2.1856689453125, 2.30108642578125, 2.41650390625, 2.53192138671875, 2.6473388671875, 2.76275634765625, 2.878173828125, 2.99359130859375, 3.1090087890625, 3.22442626953125, 3.33984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 14.0, 15.0, 22.0, 51.0, 51.0, 62.0, 139.0, 328.0, 828.0, 2826.0, 15529.0, 343292.0, 656704.0, 23356.0, 3529.0, 970.0, 408.0, 169.0, 103.0, 50.0, 25.0, 23.0, 16.0, 10.0, 5.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.3536376953125, -3.258056640625, -3.1624755859375, -3.06689453125, -2.9713134765625, -2.875732421875, -2.7801513671875, -2.6845703125, -2.5889892578125, -2.493408203125, -2.3978271484375, -2.30224609375, -2.2066650390625, -2.111083984375, -2.0155029296875, -1.919921875, -1.8243408203125, -1.728759765625, -1.6331787109375, -1.53759765625, -1.4420166015625, -1.346435546875, -1.2508544921875, -1.1552734375, -1.0596923828125, -0.964111328125, -0.8685302734375, -0.77294921875, -0.6773681640625, -0.581787109375, -0.4862060546875, -0.390625, -0.2950439453125, -0.199462890625, -0.1038818359375, -0.00830078125, 0.0872802734375, 0.182861328125, 0.2784423828125, 0.3740234375, 0.4696044921875, 0.565185546875, 0.6607666015625, 0.75634765625, 0.8519287109375, 0.947509765625, 1.0430908203125, 1.138671875, 1.2342529296875, 1.329833984375, 1.4254150390625, 1.52099609375, 1.6165771484375, 1.712158203125, 1.8077392578125, 1.9033203125, 1.9989013671875, 2.094482421875, 2.1900634765625, 2.28564453125, 2.3812255859375, 2.476806640625, 2.5723876953125, 2.66796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 11.0, 15.0, 27.0, 29.0, 54.0, 66.0, 86.0, 107.0, 119.0, 104.0, 92.0, 76.0, 41.0, 31.0, 37.0, 16.0, 14.0, 10.0, 10.0, 8.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00029087066650390625, -0.0002825148403644562, -0.0002741590142250061, -0.00026580318808555603, -0.00025744736194610596, -0.0002490915358066559, -0.0002407357096672058, -0.00023237988352775574, -0.00022402405738830566, -0.0002156682312488556, -0.00020731240510940552, -0.00019895657896995544, -0.00019060075283050537, -0.0001822449266910553, -0.00017388910055160522, -0.00016553327441215515, -0.00015717744827270508, -0.000148821622133255, -0.00014046579599380493, -0.00013210996985435486, -0.00012375414371490479, -0.00011539831757545471, -0.00010704249143600464, -9.868666529655457e-05, -9.033083915710449e-05, -8.197501301765442e-05, -7.361918687820435e-05, -6.526336073875427e-05, -5.69075345993042e-05, -4.8551708459854126e-05, -4.019588232040405e-05, -3.184005618095398e-05, -2.3484230041503906e-05, -1.5128403902053833e-05, -6.77257776260376e-06, 1.5832483768463135e-06, 9.939074516296387e-06, 1.829490065574646e-05, 2.6650726795196533e-05, 3.5006552934646606e-05, 4.336237907409668e-05, 5.171820521354675e-05, 6.0074031352996826e-05, 6.84298574924469e-05, 7.678568363189697e-05, 8.514150977134705e-05, 9.349733591079712e-05, 0.00010185316205024719, 0.00011020898818969727, 0.00011856481432914734, 0.0001269206404685974, 0.00013527646660804749, 0.00014363229274749756, 0.00015198811888694763, 0.0001603439450263977, 0.00016869977116584778, 0.00017705559730529785, 0.00018541142344474792, 0.000193767249584198, 0.00020212307572364807, 0.00021047890186309814, 0.00021883472800254822, 0.0002271905541419983, 0.00023554638028144836, 0.00024390220642089844]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 17.0, 22.0, 35.0, 58.0, 109.0, 215.0, 465.0, 1297.0, 5242.0, 48450.0, 876484.0, 105370.0, 7906.0, 1754.0, 585.0, 241.0, 122.0, 75.0, 38.0, 24.0, 15.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.36859130859375, -4.2684326171875, -4.16827392578125, -4.068115234375, -3.96795654296875, -3.8677978515625, -3.76763916015625, -3.66748046875, -3.56732177734375, -3.4671630859375, -3.36700439453125, -3.266845703125, -3.16668701171875, -3.0665283203125, -2.96636962890625, -2.8662109375, -2.76605224609375, -2.6658935546875, -2.56573486328125, -2.465576171875, -2.36541748046875, -2.2652587890625, -2.16510009765625, -2.06494140625, -1.96478271484375, -1.8646240234375, -1.76446533203125, -1.664306640625, -1.56414794921875, -1.4639892578125, -1.36383056640625, -1.263671875, -1.16351318359375, -1.0633544921875, -0.96319580078125, -0.863037109375, -0.76287841796875, -0.6627197265625, -0.56256103515625, -0.46240234375, -0.36224365234375, -0.2620849609375, -0.16192626953125, -0.061767578125, 0.03839111328125, 0.1385498046875, 0.23870849609375, 0.3388671875, 0.43902587890625, 0.5391845703125, 0.63934326171875, 0.739501953125, 0.83966064453125, 0.9398193359375, 1.03997802734375, 1.14013671875, 1.24029541015625, 1.3404541015625, 1.44061279296875, 1.540771484375, 1.64093017578125, 1.7410888671875, 1.84124755859375, 1.94140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 9.0, 15.0, 23.0, 36.0, 83.0, 115.0, 163.0, 161.0, 128.0, 108.0, 67.0, 31.0, 28.0, 12.0, 11.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.78515625, -3.686370849609375, -3.58758544921875, -3.488800048828125, -3.3900146484375, -3.291229248046875, -3.19244384765625, -3.093658447265625, -2.994873046875, -2.896087646484375, -2.79730224609375, -2.698516845703125, -2.5997314453125, -2.500946044921875, -2.40216064453125, -2.303375244140625, -2.20458984375, -2.105804443359375, -2.00701904296875, -1.908233642578125, -1.8094482421875, -1.710662841796875, -1.61187744140625, -1.513092041015625, -1.414306640625, -1.315521240234375, -1.21673583984375, -1.117950439453125, -1.0191650390625, -0.920379638671875, -0.82159423828125, -0.722808837890625, -0.6240234375, -0.525238037109375, -0.42645263671875, -0.327667236328125, -0.2288818359375, -0.130096435546875, -0.03131103515625, 0.067474365234375, 0.166259765625, 0.265045166015625, 0.36383056640625, 0.462615966796875, 0.5614013671875, 0.660186767578125, 0.75897216796875, 0.857757568359375, 0.95654296875, 1.055328369140625, 1.15411376953125, 1.252899169921875, 1.3516845703125, 1.450469970703125, 1.54925537109375, 1.648040771484375, 1.746826171875, 1.845611572265625, 1.94439697265625, 2.043182373046875, 2.1419677734375, 2.240753173828125, 2.33953857421875, 2.438323974609375, 2.537109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 24.0, 93.0, 269.0, 346.0, 185.0, 49.0, 16.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-113.35630798339844, -111.19064331054688, -109.02497100830078, -106.85930633544922, -104.69363403320312, -102.52796936035156, -100.36229705810547, -98.1966323852539, -96.03096008300781, -93.86529541015625, -91.69962310791016, -89.5339584350586, -87.3682861328125, -85.20262145996094, -83.03694915771484, -80.87128448486328, -78.70561981201172, -76.53995513916016, -74.37428283691406, -72.2086181640625, -70.0429458618164, -67.87728118896484, -65.71160888671875, -63.54594421386719, -61.38027572631836, -59.21460723876953, -57.0489387512207, -54.883270263671875, -52.71760559082031, -50.55193328857422, -48.386268615722656, -46.22060012817383, -44.054927825927734, -41.889259338378906, -39.72359085083008, -37.55792236328125, -35.39225769042969, -33.226585388183594, -31.06092071533203, -28.895252227783203, -26.729583740234375, -24.563915252685547, -22.39824676513672, -20.232580184936523, -18.066911697387695, -15.901243209838867, -13.735575675964355, -11.569908142089844, -9.404239654541016, -7.238571643829346, -5.072903633117676, -2.907235622406006, -0.7415676116943359, 1.4241008758544922, 3.589768409729004, 5.755435943603516, 7.921104431152344, 10.086772918701172, 12.252440452575684, 14.418107986450195, 16.583776473999023, 18.74944496154785, 20.915111541748047, 23.080780029296875, 25.246448516845703]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 11.0, 11.0, 19.0, 15.0, 22.0, 21.0, 29.0, 34.0, 42.0, 37.0, 37.0, 47.0, 39.0, 59.0, 63.0, 60.0, 53.0, 45.0, 55.0, 43.0, 29.0, 39.0, 31.0, 29.0, 18.0, 21.0, 9.0, 18.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-23.170543670654297, -22.52720069885254, -21.88385581970215, -21.24051284790039, -20.597169876098633, -19.953826904296875, -19.310482025146484, -18.667139053344727, -18.02379608154297, -17.38045310974121, -16.73710823059082, -16.093765258789062, -15.450422286987305, -14.80707836151123, -14.163734436035156, -13.520391464233398, -12.877047538757324, -12.23370361328125, -11.590360641479492, -10.947016716003418, -10.30367374420166, -9.660329818725586, -9.016986846923828, -8.373642921447754, -7.730299472808838, -7.086956024169922, -6.443612575531006, -5.80026912689209, -5.156925201416016, -4.513582229614258, -3.8702383041381836, -3.2268948554992676, -2.5835514068603516, -1.9402079582214355, -1.29686439037323, -0.6535208225250244, -0.010177373886108398, 0.6331660747528076, 1.2765097618103027, 1.9198532104492188, 2.5631966590881348, 3.206540107727051, 3.849883556365967, 4.493227005004883, 5.136570930480957, 5.779913902282715, 6.423257827758789, 7.066601276397705, 7.709944725036621, 8.353288650512695, 8.996631622314453, 9.639975547790527, 10.283318519592285, 10.92666244506836, 11.570005416870117, 12.213349342346191, 12.856693267822266, 13.50003719329834, 14.143380165100098, 14.786724090576172, 15.43006706237793, 16.073410034179688, 16.716754913330078, 17.360097885131836, 18.003440856933594]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 10.0, 24.0, 26.0, 32.0, 57.0, 77.0, 131.0, 229.0, 368.0, 616.0, 1228.0, 2837.0, 9861.0, 73895.0, 4056716.0, 37012.0, 6598.0, 2139.0, 985.0, 567.0, 281.0, 189.0, 123.0, 82.0, 63.0, 37.0, 25.0, 18.0, 19.0, 5.0, 8.0, 1.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.46124267578125, -3.3131103515625, -3.16497802734375, -3.016845703125, -2.86871337890625, -2.7205810546875, -2.57244873046875, -2.42431640625, -2.27618408203125, -2.1280517578125, -1.97991943359375, -1.831787109375, -1.68365478515625, -1.5355224609375, -1.38739013671875, -1.2392578125, -1.09112548828125, -0.9429931640625, -0.79486083984375, -0.646728515625, -0.49859619140625, -0.3504638671875, -0.20233154296875, -0.05419921875, 0.09393310546875, 0.2420654296875, 0.39019775390625, 0.538330078125, 0.68646240234375, 0.8345947265625, 0.98272705078125, 1.130859375, 1.27899169921875, 1.4271240234375, 1.57525634765625, 1.723388671875, 1.87152099609375, 2.0196533203125, 2.16778564453125, 2.31591796875, 2.46405029296875, 2.6121826171875, 2.76031494140625, 2.908447265625, 3.05657958984375, 3.2047119140625, 3.35284423828125, 3.5009765625, 3.64910888671875, 3.7972412109375, 3.94537353515625, 4.093505859375, 4.24163818359375, 4.3897705078125, 4.53790283203125, 4.68603515625, 4.83416748046875, 4.9822998046875, 5.13043212890625, 5.278564453125, 5.42669677734375, 5.5748291015625, 5.72296142578125, 5.87109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 9.0, 9.0, 14.0, 16.0, 37.0, 44.0, 59.0, 76.0, 102.0, 99.0, 101.0, 89.0, 80.0, 76.0, 56.0, 39.0, 39.0, 16.0, 10.0, 10.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.791015625, -1.7340545654296875, -1.677093505859375, -1.6201324462890625, -1.56317138671875, -1.5062103271484375, -1.449249267578125, -1.3922882080078125, -1.3353271484375, -1.2783660888671875, -1.221405029296875, -1.1644439697265625, -1.10748291015625, -1.0505218505859375, -0.993560791015625, -0.9365997314453125, -0.879638671875, -0.8226776123046875, -0.765716552734375, -0.7087554931640625, -0.65179443359375, -0.5948333740234375, -0.537872314453125, -0.4809112548828125, -0.4239501953125, -0.3669891357421875, -0.310028076171875, -0.2530670166015625, -0.19610595703125, -0.1391448974609375, -0.082183837890625, -0.0252227783203125, 0.03173828125, 0.0886993408203125, 0.145660400390625, 0.2026214599609375, 0.25958251953125, 0.3165435791015625, 0.373504638671875, 0.4304656982421875, 0.4874267578125, 0.5443878173828125, 0.601348876953125, 0.6583099365234375, 0.71527099609375, 0.7722320556640625, 0.829193115234375, 0.8861541748046875, 0.943115234375, 1.0000762939453125, 1.057037353515625, 1.1139984130859375, 1.17095947265625, 1.2279205322265625, 1.284881591796875, 1.3418426513671875, 1.3988037109375, 1.4557647705078125, 1.512725830078125, 1.5696868896484375, 1.62664794921875, 1.6836090087890625, 1.740570068359375, 1.7975311279296875, 1.8544921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 9.0, 6.0, 16.0, 17.0, 26.0, 45.0, 47.0, 56.0, 109.0, 131.0, 201.0, 294.0, 381.0, 586.0, 992.0, 1854.0, 3736.0, 7788.0, 20004.0, 78790.0, 3807073.0, 214495.0, 34566.0, 11633.0, 5038.0, 2505.0, 1412.0, 792.0, 489.0, 337.0, 232.0, 161.0, 129.0, 92.0, 70.0, 45.0, 34.0, 29.0, 16.0, 13.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.71875, -2.633056640625, -2.54736328125, -2.461669921875, -2.3759765625, -2.290283203125, -2.20458984375, -2.118896484375, -2.033203125, -1.947509765625, -1.86181640625, -1.776123046875, -1.6904296875, -1.604736328125, -1.51904296875, -1.433349609375, -1.34765625, -1.261962890625, -1.17626953125, -1.090576171875, -1.0048828125, -0.919189453125, -0.83349609375, -0.747802734375, -0.662109375, -0.576416015625, -0.49072265625, -0.405029296875, -0.3193359375, -0.233642578125, -0.14794921875, -0.062255859375, 0.0234375, 0.109130859375, 0.19482421875, 0.280517578125, 0.3662109375, 0.451904296875, 0.53759765625, 0.623291015625, 0.708984375, 0.794677734375, 0.88037109375, 0.966064453125, 1.0517578125, 1.137451171875, 1.22314453125, 1.308837890625, 1.39453125, 1.480224609375, 1.56591796875, 1.651611328125, 1.7373046875, 1.822998046875, 1.90869140625, 1.994384765625, 2.080078125, 2.165771484375, 2.25146484375, 2.337158203125, 2.4228515625, 2.508544921875, 2.59423828125, 2.679931640625, 2.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 11.0, 10.0, 8.0, 12.0, 19.0, 35.0, 56.0, 90.0, 213.0, 3031.0, 269.0, 101.0, 70.0, 41.0, 18.0, 17.0, 13.0, 11.0, 5.0, 9.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97119140625, -0.9315872192382812, -0.8919830322265625, -0.8523788452148438, -0.812774658203125, -0.7731704711914062, -0.7335662841796875, -0.6939620971679688, -0.65435791015625, -0.6147537231445312, -0.5751495361328125, -0.5355453491210938, -0.495941162109375, -0.45633697509765625, -0.4167327880859375, -0.37712860107421875, -0.3375244140625, -0.29792022705078125, -0.2583160400390625, -0.21871185302734375, -0.179107666015625, -0.13950347900390625, -0.0998992919921875, -0.06029510498046875, -0.02069091796875, 0.01891326904296875, 0.0585174560546875, 0.09812164306640625, 0.137725830078125, 0.17733001708984375, 0.2169342041015625, 0.25653839111328125, 0.296142578125, 0.33574676513671875, 0.3753509521484375, 0.41495513916015625, 0.454559326171875, 0.49416351318359375, 0.5337677001953125, 0.5733718872070312, 0.61297607421875, 0.6525802612304688, 0.6921844482421875, 0.7317886352539062, 0.771392822265625, 0.8109970092773438, 0.8506011962890625, 0.8902053833007812, 0.9298095703125, 0.9694137573242188, 1.0090179443359375, 1.0486221313476562, 1.088226318359375, 1.1278305053710938, 1.1674346923828125, 1.2070388793945312, 1.24664306640625, 1.2862472534179688, 1.3258514404296875, 1.3654556274414062, 1.405059814453125, 1.4446640014648438, 1.4842681884765625, 1.5238723754882812, 1.5634765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 11.0, 16.0, 31.0, 35.0, 66.0, 86.0, 102.0, 118.0, 105.0, 99.0, 83.0, 64.0, 42.0, 28.0, 25.0, 24.0, 16.0, 15.0, 13.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5456020832061768, -3.344350814819336, -3.143099784851074, -2.9418485164642334, -2.7405972480773926, -2.539346218109131, -2.33809494972229, -2.136843681335449, -1.9355926513671875, -1.7343415021896362, -1.533090353012085, -1.3318390846252441, -1.1305879354476929, -0.9293367862701416, -0.7280855178833008, -0.5268343687057495, -0.32558321952819824, -0.12433204054832458, 0.07691913843154907, 0.2781703472137451, 0.4794214963912964, 0.6806726455688477, 0.8819239139556885, 1.0831750631332397, 1.284426212310791, 1.4856773614883423, 1.6869285106658936, 1.8881797790527344, 2.089430809020996, 2.290682077407837, 2.4919333457946777, 2.6931843757629395, 2.8944358825683594, 3.0956871509552, 3.296938180923462, 3.4981894493103027, 3.6994404792785645, 3.9006917476654053, 4.101943016052246, 4.303194046020508, 4.5044450759887695, 4.705696105957031, 4.906947612762451, 5.108198642730713, 5.309449672698975, 5.5107011795043945, 5.711952209472656, 5.913203239440918, 6.114454746246338, 6.3157057762146, 6.5169572830200195, 6.718208312988281, 6.919459342956543, 7.120710372924805, 7.321961879730225, 7.523212909698486, 7.724464416503906, 7.925715446472168, 8.12696647644043, 8.328218460083008, 8.52946949005127, 8.730720520019531, 8.931971549987793, 9.133222579956055, 9.334473609924316]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 7.0, 3.0, 7.0, 16.0, 5.0, 10.0, 14.0, 11.0, 13.0, 19.0, 14.0, 25.0, 21.0, 20.0, 34.0, 29.0, 22.0, 32.0, 27.0, 25.0, 32.0, 37.0, 34.0, 30.0, 34.0, 38.0, 44.0, 34.0, 30.0, 34.0, 23.0, 37.0, 32.0, 33.0, 22.0, 12.0, 28.0, 27.0, 16.0, 11.0, 13.0, 11.0, 9.0, 5.0, 3.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8851871490478516, -3.7598843574523926, -3.6345813274383545, -3.5092785358428955, -3.3839755058288574, -3.2586727142333984, -3.1333699226379395, -3.0080671310424805, -2.8827641010284424, -2.7574613094329834, -2.6321582794189453, -2.5068554878234863, -2.3815526962280273, -2.2562496662139893, -2.1309468746185303, -2.005643844604492, -1.8803410530090332, -1.7550381422042847, -1.6297352313995361, -1.5044324398040771, -1.3791295289993286, -1.25382661819458, -1.128523826599121, -1.0032209157943726, -0.877918004989624, -0.7526150941848755, -0.6273122429847717, -0.502009391784668, -0.37670648097991943, -0.2514035701751709, -0.12610071897506714, -0.0007978677749633789, 0.12450456619262695, 0.2498074471950531, 0.37511032819747925, 0.500413179397583, 0.6257160902023315, 0.7510190010070801, 0.8763218522071838, 1.0016247034072876, 1.1269276142120361, 1.2522305250167847, 1.3775334358215332, 1.5028362274169922, 1.6281391382217407, 1.7534420490264893, 1.8787448406219482, 2.0040478706359863, 2.1293506622314453, 2.2546534538269043, 2.3799564838409424, 2.5052592754364014, 2.6305623054504395, 2.7558650970458984, 2.8811678886413574, 3.0064706802368164, 3.1317737102508545, 3.2570765018463135, 3.3823795318603516, 3.5076823234558105, 3.6329851150512695, 3.7582881450653076, 3.8835909366607666, 4.008893966674805, 4.134196758270264]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 11.0, 9.0, 11.0, 21.0, 29.0, 44.0, 51.0, 100.0, 139.0, 256.0, 489.0, 953.0, 1776.0, 3909.0, 10122.0, 28554.0, 92678.0, 306794.0, 397029.0, 140079.0, 41239.0, 13941.0, 5521.0, 2235.0, 1109.0, 606.0, 324.0, 192.0, 116.0, 80.0, 35.0, 31.0, 18.0, 12.0, 15.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.1015625, -3.020294189453125, -2.93902587890625, -2.857757568359375, -2.7764892578125, -2.695220947265625, -2.61395263671875, -2.532684326171875, -2.451416015625, -2.370147705078125, -2.28887939453125, -2.207611083984375, -2.1263427734375, -2.045074462890625, -1.96380615234375, -1.882537841796875, -1.80126953125, -1.720001220703125, -1.63873291015625, -1.557464599609375, -1.4761962890625, -1.394927978515625, -1.31365966796875, -1.232391357421875, -1.151123046875, -1.069854736328125, -0.98858642578125, -0.907318115234375, -0.8260498046875, -0.744781494140625, -0.66351318359375, -0.582244873046875, -0.5009765625, -0.419708251953125, -0.33843994140625, -0.257171630859375, -0.1759033203125, -0.094635009765625, -0.01336669921875, 0.067901611328125, 0.149169921875, 0.230438232421875, 0.31170654296875, 0.392974853515625, 0.4742431640625, 0.555511474609375, 0.63677978515625, 0.718048095703125, 0.79931640625, 0.880584716796875, 0.96185302734375, 1.043121337890625, 1.1243896484375, 1.205657958984375, 1.28692626953125, 1.368194580078125, 1.449462890625, 1.530731201171875, 1.61199951171875, 1.693267822265625, 1.7745361328125, 1.855804443359375, 1.93707275390625, 2.018341064453125, 2.099609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 9.0, 5.0, 11.0, 13.0, 22.0, 35.0, 36.0, 42.0, 43.0, 73.0, 81.0, 74.0, 75.0, 83.0, 60.0, 57.0, 51.0, 47.0, 51.0, 30.0, 24.0, 14.0, 12.0, 14.0, 10.0, 9.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.5506591796875, -1.501708984375, -1.4527587890625, -1.40380859375, -1.3548583984375, -1.305908203125, -1.2569580078125, -1.2080078125, -1.1590576171875, -1.110107421875, -1.0611572265625, -1.01220703125, -0.9632568359375, -0.914306640625, -0.8653564453125, -0.81640625, -0.7674560546875, -0.718505859375, -0.6695556640625, -0.62060546875, -0.5716552734375, -0.522705078125, -0.4737548828125, -0.4248046875, -0.3758544921875, -0.326904296875, -0.2779541015625, -0.22900390625, -0.1800537109375, -0.131103515625, -0.0821533203125, -0.033203125, 0.0157470703125, 0.064697265625, 0.1136474609375, 0.16259765625, 0.2115478515625, 0.260498046875, 0.3094482421875, 0.3583984375, 0.4073486328125, 0.456298828125, 0.5052490234375, 0.55419921875, 0.6031494140625, 0.652099609375, 0.7010498046875, 0.75, 0.7989501953125, 0.847900390625, 0.8968505859375, 0.94580078125, 0.9947509765625, 1.043701171875, 1.0926513671875, 1.1416015625, 1.1905517578125, 1.239501953125, 1.2884521484375, 1.33740234375, 1.3863525390625, 1.435302734375, 1.4842529296875, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 6.0, 6.0, 7.0, 8.0, 8.0, 17.0, 35.0, 20.0, 43.0, 63.0, 90.0, 114.0, 225.0, 350.0, 576.0, 1168.0, 2511.0, 6446.0, 22367.0, 108384.0, 535327.0, 297693.0, 52321.0, 12619.0, 4208.0, 1756.0, 864.0, 506.0, 255.0, 167.0, 103.0, 82.0, 52.0, 33.0, 28.0, 34.0, 11.0, 12.0, 9.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.326171875, -3.22772216796875, -3.1292724609375, -3.03082275390625, -2.932373046875, -2.83392333984375, -2.7354736328125, -2.63702392578125, -2.53857421875, -2.44012451171875, -2.3416748046875, -2.24322509765625, -2.144775390625, -2.04632568359375, -1.9478759765625, -1.84942626953125, -1.7509765625, -1.65252685546875, -1.5540771484375, -1.45562744140625, -1.357177734375, -1.25872802734375, -1.1602783203125, -1.06182861328125, -0.96337890625, -0.86492919921875, -0.7664794921875, -0.66802978515625, -0.569580078125, -0.47113037109375, -0.3726806640625, -0.27423095703125, -0.17578125, -0.07733154296875, 0.0211181640625, 0.11956787109375, 0.218017578125, 0.31646728515625, 0.4149169921875, 0.51336669921875, 0.61181640625, 0.71026611328125, 0.8087158203125, 0.90716552734375, 1.005615234375, 1.10406494140625, 1.2025146484375, 1.30096435546875, 1.3994140625, 1.49786376953125, 1.5963134765625, 1.69476318359375, 1.793212890625, 1.89166259765625, 1.9901123046875, 2.08856201171875, 2.18701171875, 2.28546142578125, 2.3839111328125, 2.48236083984375, 2.580810546875, 2.67926025390625, 2.7777099609375, 2.87615966796875, 2.974609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 6.0, 11.0, 17.0, 19.0, 23.0, 28.0, 39.0, 44.0, 51.0, 48.0, 56.0, 71.0, 77.0, 62.0, 48.0, 48.0, 66.0, 54.0, 47.0, 33.0, 28.0, 37.0, 27.0, 10.0, 12.0, 6.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29296875, -6.10784912109375, -5.9227294921875, -5.73760986328125, -5.552490234375, -5.36737060546875, -5.1822509765625, -4.99713134765625, -4.81201171875, -4.62689208984375, -4.4417724609375, -4.25665283203125, -4.071533203125, -3.88641357421875, -3.7012939453125, -3.51617431640625, -3.3310546875, -3.14593505859375, -2.9608154296875, -2.77569580078125, -2.590576171875, -2.40545654296875, -2.2203369140625, -2.03521728515625, -1.85009765625, -1.66497802734375, -1.4798583984375, -1.29473876953125, -1.109619140625, -0.92449951171875, -0.7393798828125, -0.55426025390625, -0.369140625, -0.18402099609375, 0.0010986328125, 0.18621826171875, 0.371337890625, 0.55645751953125, 0.7415771484375, 0.92669677734375, 1.11181640625, 1.29693603515625, 1.4820556640625, 1.66717529296875, 1.852294921875, 2.03741455078125, 2.2225341796875, 2.40765380859375, 2.5927734375, 2.77789306640625, 2.9630126953125, 3.14813232421875, 3.333251953125, 3.51837158203125, 3.7034912109375, 3.88861083984375, 4.07373046875, 4.25885009765625, 4.4439697265625, 4.62908935546875, 4.814208984375, 4.99932861328125, 5.1844482421875, 5.36956787109375, 5.5546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 10.0, 11.0, 17.0, 20.0, 58.0, 135.0, 316.0, 930.0, 4832.0, 97352.0, 902893.0, 37901.0, 2998.0, 642.0, 221.0, 100.0, 46.0, 27.0, 16.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.314453125, -3.238037109375, -3.16162109375, -3.085205078125, -3.0087890625, -2.932373046875, -2.85595703125, -2.779541015625, -2.703125, -2.626708984375, -2.55029296875, -2.473876953125, -2.3974609375, -2.321044921875, -2.24462890625, -2.168212890625, -2.091796875, -2.015380859375, -1.93896484375, -1.862548828125, -1.7861328125, -1.709716796875, -1.63330078125, -1.556884765625, -1.48046875, -1.404052734375, -1.32763671875, -1.251220703125, -1.1748046875, -1.098388671875, -1.02197265625, -0.945556640625, -0.869140625, -0.792724609375, -0.71630859375, -0.639892578125, -0.5634765625, -0.487060546875, -0.41064453125, -0.334228515625, -0.2578125, -0.181396484375, -0.10498046875, -0.028564453125, 0.0478515625, 0.124267578125, 0.20068359375, 0.277099609375, 0.353515625, 0.429931640625, 0.50634765625, 0.582763671875, 0.6591796875, 0.735595703125, 0.81201171875, 0.888427734375, 0.96484375, 1.041259765625, 1.11767578125, 1.194091796875, 1.2705078125, 1.346923828125, 1.42333984375, 1.499755859375, 1.576171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 10.0, 15.0, 19.0, 21.0, 35.0, 47.0, 74.0, 85.0, 100.0, 109.0, 106.0, 75.0, 54.0, 73.0, 48.0, 29.0, 24.0, 19.0, 10.0, 11.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002689361572265625, -0.0002620033919811249, -0.00025507062673568726, -0.00024813786149024963, -0.000241205096244812, -0.0002342723309993744, -0.00022733956575393677, -0.00022040680050849915, -0.00021347403526306152, -0.0002065412700176239, -0.00019960850477218628, -0.00019267573952674866, -0.00018574297428131104, -0.0001788102090358734, -0.0001718774437904358, -0.00016494467854499817, -0.00015801191329956055, -0.00015107914805412292, -0.0001441463828086853, -0.00013721361756324768, -0.00013028085231781006, -0.00012334808707237244, -0.00011641532182693481, -0.00010948255658149719, -0.00010254979133605957, -9.561702609062195e-05, -8.868426084518433e-05, -8.17514955997467e-05, -7.481873035430908e-05, -6.788596510887146e-05, -6.095319986343384e-05, -5.4020434617996216e-05, -4.7087669372558594e-05, -4.015490412712097e-05, -3.322213888168335e-05, -2.6289373636245728e-05, -1.9356608390808105e-05, -1.2423843145370483e-05, -5.491077899932861e-06, 1.4416873455047607e-06, 8.374452590942383e-06, 1.5307217836380005e-05, 2.2239983081817627e-05, 2.917274832725525e-05, 3.610551357269287e-05, 4.303827881813049e-05, 4.9971044063568115e-05, 5.690380930900574e-05, 6.383657455444336e-05, 7.076933979988098e-05, 7.77021050453186e-05, 8.463487029075623e-05, 9.156763553619385e-05, 9.850040078163147e-05, 0.00010543316602706909, 0.00011236593127250671, 0.00011929869651794434, 0.00012623146176338196, 0.00013316422700881958, 0.0001400969922542572, 0.00014702975749969482, 0.00015396252274513245, 0.00016089528799057007, 0.0001678280532360077, 0.0001747608184814453]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 5.0, 11.0, 10.0, 10.0, 16.0, 24.0, 47.0, 51.0, 84.0, 172.0, 311.0, 540.0, 1126.0, 3000.0, 10576.0, 64159.0, 604797.0, 320168.0, 32473.0, 6865.0, 2186.0, 875.0, 426.0, 226.0, 125.0, 79.0, 42.0, 43.0, 21.0, 24.0, 16.0, 5.0, 8.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.2109375, -1.1689453125, -1.126953125, -1.0849609375, -1.04296875, -1.0009765625, -0.958984375, -0.9169921875, -0.875, -0.8330078125, -0.791015625, -0.7490234375, -0.70703125, -0.6650390625, -0.623046875, -0.5810546875, -0.5390625, -0.4970703125, -0.455078125, -0.4130859375, -0.37109375, -0.3291015625, -0.287109375, -0.2451171875, -0.203125, -0.1611328125, -0.119140625, -0.0771484375, -0.03515625, 0.0068359375, 0.048828125, 0.0908203125, 0.1328125, 0.1748046875, 0.216796875, 0.2587890625, 0.30078125, 0.3427734375, 0.384765625, 0.4267578125, 0.46875, 0.5107421875, 0.552734375, 0.5947265625, 0.63671875, 0.6787109375, 0.720703125, 0.7626953125, 0.8046875, 0.8466796875, 0.888671875, 0.9306640625, 0.97265625, 1.0146484375, 1.056640625, 1.0986328125, 1.140625, 1.1826171875, 1.224609375, 1.2666015625, 1.30859375, 1.3505859375, 1.392578125, 1.4345703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 11.0, 2.0, 10.0, 17.0, 18.0, 29.0, 35.0, 52.0, 61.0, 82.0, 90.0, 91.0, 84.0, 70.0, 75.0, 51.0, 46.0, 41.0, 29.0, 26.0, 16.0, 10.0, 8.0, 5.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4423828125, -1.402130126953125, -1.36187744140625, -1.321624755859375, -1.2813720703125, -1.241119384765625, -1.20086669921875, -1.160614013671875, -1.120361328125, -1.080108642578125, -1.03985595703125, -0.999603271484375, -0.9593505859375, -0.919097900390625, -0.87884521484375, -0.838592529296875, -0.79833984375, -0.758087158203125, -0.71783447265625, -0.677581787109375, -0.6373291015625, -0.597076416015625, -0.55682373046875, -0.516571044921875, -0.476318359375, -0.436065673828125, -0.39581298828125, -0.355560302734375, -0.3153076171875, -0.275054931640625, -0.23480224609375, -0.194549560546875, -0.154296875, -0.114044189453125, -0.07379150390625, -0.033538818359375, 0.0067138671875, 0.046966552734375, 0.08721923828125, 0.127471923828125, 0.167724609375, 0.207977294921875, 0.24822998046875, 0.288482666015625, 0.3287353515625, 0.368988037109375, 0.40924072265625, 0.449493408203125, 0.48974609375, 0.529998779296875, 0.57025146484375, 0.610504150390625, 0.6507568359375, 0.691009521484375, 0.73126220703125, 0.771514892578125, 0.811767578125, 0.852020263671875, 0.89227294921875, 0.932525634765625, 0.9727783203125, 1.013031005859375, 1.05328369140625, 1.093536376953125, 1.1337890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 12.0, 23.0, 44.0, 76.0, 154.0, 198.0, 169.0, 154.0, 83.0, 39.0, 29.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.013925552368164, -23.882144927978516, -22.750364303588867, -21.61858367919922, -20.48680305480957, -19.355022430419922, -18.223241806030273, -17.091461181640625, -15.959680557250977, -14.827899932861328, -13.69611930847168, -12.564338684082031, -11.432558059692383, -10.300777435302734, -9.168996810913086, -8.037216186523438, -6.905435562133789, -5.773654937744141, -4.641874313354492, -3.5100936889648438, -2.3783130645751953, -1.2465324401855469, -0.11475181579589844, 1.01702880859375, 2.1488094329833984, 3.280590057373047, 4.412370681762695, 5.544151306152344, 6.675931930541992, 7.807712554931641, 8.939493179321289, 10.071273803710938, 11.203056335449219, 12.334836959838867, 13.466617584228516, 14.598398208618164, 15.730178833007812, 16.86195945739746, 17.99374008178711, 19.125520706176758, 20.257301330566406, 21.389081954956055, 22.520862579345703, 23.65264320373535, 24.784423828125, 25.91620445251465, 27.047985076904297, 28.179765701293945, 29.311546325683594, 30.443326950073242, 31.57510757446289, 32.706886291503906, 33.83866882324219, 34.97045135498047, 36.102230072021484, 37.2340087890625, 38.36579132080078, 39.49757385253906, 40.62935256958008, 41.761131286621094, 42.892913818359375, 44.024696350097656, 45.15647506713867, 46.28825378417969, 47.42003631591797]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 8.0, 9.0, 18.0, 15.0, 20.0, 21.0, 22.0, 35.0, 32.0, 44.0, 47.0, 47.0, 54.0, 68.0, 60.0, 55.0, 57.0, 60.0, 43.0, 47.0, 17.0, 46.0, 35.0, 23.0, 23.0, 24.0, 19.0, 11.0, 5.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.314420700073242, -25.57833480834961, -24.842247009277344, -24.10616111755371, -23.370073318481445, -22.633987426757812, -21.897899627685547, -21.161813735961914, -20.42572784423828, -19.68964195251465, -18.953554153442383, -18.21746826171875, -17.481380462646484, -16.74529457092285, -16.00920867919922, -15.273120880126953, -14.537034034729004, -13.800947189331055, -13.064860343933105, -12.328773498535156, -11.592687606811523, -10.856600761413574, -10.120513916015625, -9.384428024291992, -8.648340225219727, -7.912253379821777, -7.176167011260986, -6.440080165863037, -5.703993797302246, -4.967906951904297, -4.231820106506348, -3.4957337379455566, -2.7596473693847656, -2.0235607624053955, -1.2874740362167358, -0.5513873100280762, 0.18469929695129395, 0.9207859039306641, 1.6568727493286133, 2.3929591178894043, 3.1290459632873535, 3.8651325702667236, 4.601219177246094, 5.337306022644043, 6.073392868041992, 6.809479236602783, 7.545566082000732, 8.281652450561523, 9.017739295959473, 9.753826141357422, 10.489912986755371, 11.22599983215332, 11.962085723876953, 12.698172569274902, 13.434259414672852, 14.170345306396484, 14.90643310546875, 15.6425199508667, 16.37860679626465, 17.11469268798828, 17.850780487060547, 18.58686637878418, 19.322952270507812, 20.059040069580078, 20.79512596130371]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 13.0, 18.0, 33.0, 51.0, 85.0, 145.0, 244.0, 465.0, 1029.0, 2223.0, 5363.0, 15076.0, 56912.0, 624502.0, 3312957.0, 133772.0, 26368.0, 8526.0, 3376.0, 1384.0, 758.0, 400.0, 202.0, 109.0, 92.0, 52.0, 36.0, 20.0, 15.0, 14.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.998077392578125, -1.92193603515625, -1.845794677734375, -1.7696533203125, -1.693511962890625, -1.61737060546875, -1.541229248046875, -1.465087890625, -1.388946533203125, -1.31280517578125, -1.236663818359375, -1.1605224609375, -1.084381103515625, -1.00823974609375, -0.932098388671875, -0.85595703125, -0.779815673828125, -0.70367431640625, -0.627532958984375, -0.5513916015625, -0.475250244140625, -0.39910888671875, -0.322967529296875, -0.246826171875, -0.170684814453125, -0.09454345703125, -0.018402099609375, 0.0577392578125, 0.133880615234375, 0.21002197265625, 0.286163330078125, 0.3623046875, 0.438446044921875, 0.51458740234375, 0.590728759765625, 0.6668701171875, 0.743011474609375, 0.81915283203125, 0.895294189453125, 0.971435546875, 1.047576904296875, 1.12371826171875, 1.199859619140625, 1.2760009765625, 1.352142333984375, 1.42828369140625, 1.504425048828125, 1.58056640625, 1.656707763671875, 1.73284912109375, 1.808990478515625, 1.8851318359375, 1.961273193359375, 2.03741455078125, 2.113555908203125, 2.189697265625, 2.265838623046875, 2.34197998046875, 2.418121337890625, 2.4942626953125, 2.570404052734375, 2.64654541015625, 2.722686767578125, 2.798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 8.0, 12.0, 25.0, 20.0, 31.0, 35.0, 32.0, 40.0, 46.0, 54.0, 53.0, 65.0, 62.0, 58.0, 56.0, 60.0, 42.0, 37.0, 39.0, 42.0, 38.0, 25.0, 23.0, 12.0, 16.0, 10.0, 10.0, 9.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9319381713867188, -0.8975677490234375, -0.8631973266601562, -0.828826904296875, -0.7944564819335938, -0.7600860595703125, -0.7257156372070312, -0.69134521484375, -0.6569747924804688, -0.6226043701171875, -0.5882339477539062, -0.553863525390625, -0.5194931030273438, -0.4851226806640625, -0.45075225830078125, -0.4163818359375, -0.38201141357421875, -0.3476409912109375, -0.31327056884765625, -0.278900146484375, -0.24452972412109375, -0.2101593017578125, -0.17578887939453125, -0.14141845703125, -0.10704803466796875, -0.0726776123046875, -0.03830718994140625, -0.003936767578125, 0.03043365478515625, 0.0648040771484375, 0.09917449951171875, 0.133544921875, 0.16791534423828125, 0.2022857666015625, 0.23665618896484375, 0.271026611328125, 0.30539703369140625, 0.3397674560546875, 0.37413787841796875, 0.40850830078125, 0.44287872314453125, 0.4772491455078125, 0.5116195678710938, 0.545989990234375, 0.5803604125976562, 0.6147308349609375, 0.6491012573242188, 0.6834716796875, 0.7178421020507812, 0.7522125244140625, 0.7865829467773438, 0.820953369140625, 0.8553237915039062, 0.8896942138671875, 0.9240646362304688, 0.95843505859375, 0.9928054809570312, 1.0271759033203125, 1.0615463256835938, 1.095916748046875, 1.1302871704101562, 1.1646575927734375, 1.1990280151367188, 1.2333984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 0.0, 6.0, 9.0, 5.0, 14.0, 25.0, 28.0, 81.0, 146.0, 350.0, 1000.0, 3940.0, 22370.0, 373989.0, 3718752.0, 62358.0, 8333.0, 1928.0, 534.0, 189.0, 88.0, 46.0, 24.0, 19.0, 12.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.35546875, -4.20648193359375, -4.0574951171875, -3.90850830078125, -3.759521484375, -3.61053466796875, -3.4615478515625, -3.31256103515625, -3.16357421875, -3.01458740234375, -2.8656005859375, -2.71661376953125, -2.567626953125, -2.41864013671875, -2.2696533203125, -2.12066650390625, -1.9716796875, -1.82269287109375, -1.6737060546875, -1.52471923828125, -1.375732421875, -1.22674560546875, -1.0777587890625, -0.92877197265625, -0.77978515625, -0.63079833984375, -0.4818115234375, -0.33282470703125, -0.183837890625, -0.03485107421875, 0.1141357421875, 0.26312255859375, 0.412109375, 0.56109619140625, 0.7100830078125, 0.85906982421875, 1.008056640625, 1.15704345703125, 1.3060302734375, 1.45501708984375, 1.60400390625, 1.75299072265625, 1.9019775390625, 2.05096435546875, 2.199951171875, 2.34893798828125, 2.4979248046875, 2.64691162109375, 2.7958984375, 2.94488525390625, 3.0938720703125, 3.24285888671875, 3.391845703125, 3.54083251953125, 3.6898193359375, 3.83880615234375, 3.98779296875, 4.13677978515625, 4.2857666015625, 4.43475341796875, 4.583740234375, 4.73272705078125, 4.8817138671875, 5.03070068359375, 5.1796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 8.0, 13.0, 19.0, 24.0, 36.0, 51.0, 102.0, 144.0, 304.0, 767.0, 1511.0, 583.0, 208.0, 95.0, 45.0, 41.0, 29.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.2188720703125, -4.105712890625, -3.9925537109375, -3.87939453125, -3.7662353515625, -3.653076171875, -3.5399169921875, -3.4267578125, -3.3135986328125, -3.200439453125, -3.0872802734375, -2.97412109375, -2.8609619140625, -2.747802734375, -2.6346435546875, -2.521484375, -2.4083251953125, -2.295166015625, -2.1820068359375, -2.06884765625, -1.9556884765625, -1.842529296875, -1.7293701171875, -1.6162109375, -1.5030517578125, -1.389892578125, -1.2767333984375, -1.16357421875, -1.0504150390625, -0.937255859375, -0.8240966796875, -0.7109375, -0.5977783203125, -0.484619140625, -0.3714599609375, -0.25830078125, -0.1451416015625, -0.031982421875, 0.0811767578125, 0.1943359375, 0.3074951171875, 0.420654296875, 0.5338134765625, 0.64697265625, 0.7601318359375, 0.873291015625, 0.9864501953125, 1.099609375, 1.2127685546875, 1.325927734375, 1.4390869140625, 1.55224609375, 1.6654052734375, 1.778564453125, 1.8917236328125, 2.0048828125, 2.1180419921875, 2.231201171875, 2.3443603515625, 2.45751953125, 2.5706787109375, 2.683837890625, 2.7969970703125, 2.91015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 5.0, 9.0, 21.0, 33.0, 76.0, 133.0, 243.0, 219.0, 127.0, 78.0, 29.0, 12.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.203954696655273, -27.14052963256836, -26.077106475830078, -25.013681411743164, -23.95025634765625, -22.88683319091797, -21.823408126831055, -20.75998306274414, -19.69655990600586, -18.633134841918945, -17.569711685180664, -16.50628662109375, -15.442862510681152, -14.379438400268555, -13.31601333618164, -12.252589225769043, -11.189165115356445, -10.125741004943848, -9.06231689453125, -7.998891830444336, -6.935467720031738, -5.872043609619141, -4.808619022369385, -3.745194435119629, -2.6817703247070312, -1.6183459758758545, -0.5549216270446777, 0.508502721786499, 1.5719270706176758, 2.6353511810302734, 3.6987757682800293, 4.762200355529785, 5.82562255859375, 6.889046669006348, 7.9524712562561035, 9.01589584350586, 10.079319953918457, 11.142744064331055, 12.206169128417969, 13.269593238830566, 14.333017349243164, 15.396441459655762, 16.45986557006836, 17.523290634155273, 18.586715698242188, 19.65013885498047, 20.713563919067383, 21.776988983154297, 22.840412139892578, 23.903837203979492, 24.967260360717773, 26.030685424804688, 27.09410858154297, 28.157533645629883, 29.220958709716797, 30.284381866455078, 31.347806930541992, 32.411231994628906, 33.47465515136719, 34.53807830810547, 35.601505279541016, 36.6649284362793, 37.72835159301758, 38.791778564453125, 39.855201721191406]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 17.0, 16.0, 23.0, 29.0, 31.0, 41.0, 27.0, 47.0, 54.0, 58.0, 65.0, 83.0, 64.0, 66.0, 62.0, 55.0, 44.0, 41.0, 33.0, 30.0, 23.0, 19.0, 16.0, 9.0, 3.0, 5.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.64159393310547, -16.08203887939453, -15.522483825683594, -14.962928771972656, -14.403374671936035, -13.843819618225098, -13.28426456451416, -12.724709510803223, -12.165155410766602, -11.605600357055664, -11.046045303344727, -10.486490249633789, -9.926936149597168, -9.36738109588623, -8.807826042175293, -8.248270988464355, -7.688715934753418, -7.1291608810424805, -6.569606304168701, -6.010051250457764, -5.450496673583984, -4.890941619873047, -4.331386566162109, -3.771831750869751, -3.2122769355773926, -2.652722120285034, -2.093167304992676, -1.5336122512817383, -0.9740574359893799, -0.4145026206970215, 0.14505243301391602, 0.7046072483062744, 1.2641620635986328, 1.8237168788909912, 2.3832716941833496, 2.942826747894287, 3.5023815631866455, 4.061936378479004, 4.621491432189941, 5.181046485900879, 5.740601062774658, 6.300156116485596, 6.859710693359375, 7.4192657470703125, 7.97882080078125, 8.538375854492188, 9.097930908203125, 9.657485008239746, 10.217040061950684, 10.776595115661621, 11.336150169372559, 11.89570426940918, 12.455259323120117, 13.014814376831055, 13.574369430541992, 14.13392448425293, 14.693479537963867, 15.253034591674805, 15.812589645385742, 16.37214469909668, 16.931699752807617, 17.491252899169922, 18.05080795288086, 18.610363006591797, 19.169918060302734]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 8.0, 7.0, 9.0, 21.0, 23.0, 35.0, 56.0, 91.0, 127.0, 186.0, 300.0, 517.0, 863.0, 1439.0, 2460.0, 4559.0, 8779.0, 17123.0, 36152.0, 76015.0, 157046.0, 264373.0, 235266.0, 125374.0, 59923.0, 28160.0, 13727.0, 7011.0, 3756.0, 2095.0, 1177.0, 692.0, 394.0, 264.0, 166.0, 123.0, 83.0, 54.0, 38.0, 30.0, 19.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3171844482421875, -1.273040771484375, -1.2288970947265625, -1.18475341796875, -1.1406097412109375, -1.096466064453125, -1.0523223876953125, -1.0081787109375, -0.9640350341796875, -0.919891357421875, -0.8757476806640625, -0.83160400390625, -0.7874603271484375, -0.743316650390625, -0.6991729736328125, -0.655029296875, -0.6108856201171875, -0.566741943359375, -0.5225982666015625, -0.47845458984375, -0.4343109130859375, -0.390167236328125, -0.3460235595703125, -0.3018798828125, -0.2577362060546875, -0.213592529296875, -0.1694488525390625, -0.12530517578125, -0.0811614990234375, -0.037017822265625, 0.0071258544921875, 0.05126953125, 0.0954132080078125, 0.139556884765625, 0.1837005615234375, 0.22784423828125, 0.2719879150390625, 0.316131591796875, 0.3602752685546875, 0.4044189453125, 0.4485626220703125, 0.492706298828125, 0.5368499755859375, 0.58099365234375, 0.6251373291015625, 0.669281005859375, 0.7134246826171875, 0.757568359375, 0.8017120361328125, 0.845855712890625, 0.8899993896484375, 0.93414306640625, 0.9782867431640625, 1.022430419921875, 1.0665740966796875, 1.1107177734375, 1.1548614501953125, 1.199005126953125, 1.2431488037109375, 1.28729248046875, 1.3314361572265625, 1.375579833984375, 1.4197235107421875, 1.4638671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 0.0, 4.0, 6.0, 13.0, 16.0, 19.0, 25.0, 29.0, 32.0, 33.0, 53.0, 33.0, 46.0, 63.0, 47.0, 44.0, 54.0, 49.0, 56.0, 48.0, 62.0, 36.0, 40.0, 32.0, 24.0, 20.0, 31.0, 18.0, 16.0, 10.0, 8.0, 8.0, 6.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0244140625, -0.9920806884765625, -0.959747314453125, -0.9274139404296875, -0.89508056640625, -0.8627471923828125, -0.830413818359375, -0.7980804443359375, -0.7657470703125, -0.7334136962890625, -0.701080322265625, -0.6687469482421875, -0.63641357421875, -0.6040802001953125, -0.571746826171875, -0.5394134521484375, -0.507080078125, -0.4747467041015625, -0.442413330078125, -0.4100799560546875, -0.37774658203125, -0.3454132080078125, -0.313079833984375, -0.2807464599609375, -0.2484130859375, -0.2160797119140625, -0.183746337890625, -0.1514129638671875, -0.11907958984375, -0.0867462158203125, -0.054412841796875, -0.0220794677734375, 0.01025390625, 0.0425872802734375, 0.074920654296875, 0.1072540283203125, 0.13958740234375, 0.1719207763671875, 0.204254150390625, 0.2365875244140625, 0.2689208984375, 0.3012542724609375, 0.333587646484375, 0.3659210205078125, 0.39825439453125, 0.4305877685546875, 0.462921142578125, 0.4952545166015625, 0.527587890625, 0.5599212646484375, 0.592254638671875, 0.6245880126953125, 0.65692138671875, 0.6892547607421875, 0.721588134765625, 0.7539215087890625, 0.7862548828125, 0.8185882568359375, 0.850921630859375, 0.8832550048828125, 0.91558837890625, 0.9479217529296875, 0.980255126953125, 1.0125885009765625, 1.044921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 9.0, 9.0, 20.0, 28.0, 40.0, 63.0, 110.0, 146.0, 213.0, 335.0, 553.0, 872.0, 1865.0, 4383.0, 14832.0, 77468.0, 561147.0, 323038.0, 46319.0, 10096.0, 3351.0, 1501.0, 829.0, 495.0, 262.0, 193.0, 117.0, 93.0, 42.0, 34.0, 24.0, 21.0, 12.0, 9.0, 10.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.8101806640625, -2.716064453125, -2.6219482421875, -2.52783203125, -2.4337158203125, -2.339599609375, -2.2454833984375, -2.1513671875, -2.0572509765625, -1.963134765625, -1.8690185546875, -1.77490234375, -1.6807861328125, -1.586669921875, -1.4925537109375, -1.3984375, -1.3043212890625, -1.210205078125, -1.1160888671875, -1.02197265625, -0.9278564453125, -0.833740234375, -0.7396240234375, -0.6455078125, -0.5513916015625, -0.457275390625, -0.3631591796875, -0.26904296875, -0.1749267578125, -0.080810546875, 0.0133056640625, 0.107421875, 0.2015380859375, 0.295654296875, 0.3897705078125, 0.48388671875, 0.5780029296875, 0.672119140625, 0.7662353515625, 0.8603515625, 0.9544677734375, 1.048583984375, 1.1427001953125, 1.23681640625, 1.3309326171875, 1.425048828125, 1.5191650390625, 1.61328125, 1.7073974609375, 1.801513671875, 1.8956298828125, 1.98974609375, 2.0838623046875, 2.177978515625, 2.2720947265625, 2.3662109375, 2.4603271484375, 2.554443359375, 2.6485595703125, 2.74267578125, 2.8367919921875, 2.930908203125, 3.0250244140625, 3.119140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 10.0, 7.0, 11.0, 9.0, 16.0, 14.0, 14.0, 18.0, 22.0, 28.0, 36.0, 37.0, 25.0, 46.0, 40.0, 36.0, 46.0, 53.0, 37.0, 45.0, 52.0, 37.0, 37.0, 44.0, 33.0, 42.0, 37.0, 27.0, 15.0, 25.0, 18.0, 16.0, 12.0, 3.0, 5.0, 8.0, 3.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.626953125, -3.511871337890625, -3.39678955078125, -3.281707763671875, -3.1666259765625, -3.051544189453125, -2.93646240234375, -2.821380615234375, -2.706298828125, -2.591217041015625, -2.47613525390625, -2.361053466796875, -2.2459716796875, -2.130889892578125, -2.01580810546875, -1.900726318359375, -1.78564453125, -1.670562744140625, -1.55548095703125, -1.440399169921875, -1.3253173828125, -1.210235595703125, -1.09515380859375, -0.980072021484375, -0.864990234375, -0.749908447265625, -0.63482666015625, -0.519744873046875, -0.4046630859375, -0.289581298828125, -0.17449951171875, -0.059417724609375, 0.0556640625, 0.170745849609375, 0.28582763671875, 0.400909423828125, 0.5159912109375, 0.631072998046875, 0.74615478515625, 0.861236572265625, 0.976318359375, 1.091400146484375, 1.20648193359375, 1.321563720703125, 1.4366455078125, 1.551727294921875, 1.66680908203125, 1.781890869140625, 1.89697265625, 2.012054443359375, 2.12713623046875, 2.242218017578125, 2.3572998046875, 2.472381591796875, 2.58746337890625, 2.702545166015625, 2.817626953125, 2.932708740234375, 3.04779052734375, 3.162872314453125, 3.2779541015625, 3.393035888671875, 3.50811767578125, 3.623199462890625, 3.73828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 1.0, 8.0, 16.0, 25.0, 41.0, 67.0, 114.0, 229.0, 451.0, 1068.0, 3575.0, 22706.0, 591134.0, 405261.0, 18668.0, 3258.0, 1078.0, 425.0, 181.0, 97.0, 46.0, 33.0, 24.0, 12.0, 13.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.484375, -1.42718505859375, -1.3699951171875, -1.31280517578125, -1.255615234375, -1.19842529296875, -1.1412353515625, -1.08404541015625, -1.02685546875, -0.96966552734375, -0.9124755859375, -0.85528564453125, -0.798095703125, -0.74090576171875, -0.6837158203125, -0.62652587890625, -0.5693359375, -0.51214599609375, -0.4549560546875, -0.39776611328125, -0.340576171875, -0.28338623046875, -0.2261962890625, -0.16900634765625, -0.11181640625, -0.05462646484375, 0.0025634765625, 0.05975341796875, 0.116943359375, 0.17413330078125, 0.2313232421875, 0.28851318359375, 0.345703125, 0.40289306640625, 0.4600830078125, 0.51727294921875, 0.574462890625, 0.63165283203125, 0.6888427734375, 0.74603271484375, 0.80322265625, 0.86041259765625, 0.9176025390625, 0.97479248046875, 1.031982421875, 1.08917236328125, 1.1463623046875, 1.20355224609375, 1.2607421875, 1.31793212890625, 1.3751220703125, 1.43231201171875, 1.489501953125, 1.54669189453125, 1.6038818359375, 1.66107177734375, 1.71826171875, 1.77545166015625, 1.8326416015625, 1.88983154296875, 1.947021484375, 2.00421142578125, 2.0614013671875, 2.11859130859375, 2.17578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 11.0, 18.0, 16.0, 30.0, 32.0, 30.0, 40.0, 63.0, 74.0, 94.0, 101.0, 93.0, 81.0, 73.0, 70.0, 31.0, 37.0, 22.0, 18.0, 13.0, 11.0, 1.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00025326013565063477, -0.00024688243865966797, -0.00024050474166870117, -0.00023412704467773438, -0.00022774934768676758, -0.00022137165069580078, -0.00021499395370483398, -0.0002086162567138672, -0.0002022385597229004, -0.0001958608627319336, -0.0001894831657409668, -0.00018310546875, -0.0001767277717590332, -0.0001703500747680664, -0.0001639723777770996, -0.0001575946807861328, -0.00015121698379516602, -0.00014483928680419922, -0.00013846158981323242, -0.00013208389282226562, -0.00012570619583129883, -0.00011932849884033203, -0.00011295080184936523, -0.00010657310485839844, -0.00010019540786743164, -9.381771087646484e-05, -8.744001388549805e-05, -8.106231689453125e-05, -7.468461990356445e-05, -6.830692291259766e-05, -6.192922592163086e-05, -5.555152893066406e-05, -4.9173831939697266e-05, -4.279613494873047e-05, -3.641843795776367e-05, -3.0040740966796875e-05, -2.3663043975830078e-05, -1.728534698486328e-05, -1.0907649993896484e-05, -4.5299530029296875e-06, 1.8477439880371094e-06, 8.225440979003906e-06, 1.4603137969970703e-05, 2.09808349609375e-05, 2.7358531951904297e-05, 3.3736228942871094e-05, 4.011392593383789e-05, 4.649162292480469e-05, 5.2869319915771484e-05, 5.924701690673828e-05, 6.562471389770508e-05, 7.200241088867188e-05, 7.838010787963867e-05, 8.475780487060547e-05, 9.113550186157227e-05, 9.751319885253906e-05, 0.00010389089584350586, 0.00011026859283447266, 0.00011664628982543945, 0.00012302398681640625, 0.00012940168380737305, 0.00013577938079833984, 0.00014215707778930664, 0.00014853477478027344]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 20.0, 22.0, 31.0, 43.0, 76.0, 148.0, 277.0, 554.0, 1278.0, 3431.0, 13945.0, 123505.0, 764892.0, 120715.0, 13728.0, 3409.0, 1228.0, 540.0, 271.0, 161.0, 97.0, 60.0, 37.0, 27.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.8603515625, -1.8165740966796875, -1.772796630859375, -1.7290191650390625, -1.68524169921875, -1.6414642333984375, -1.597686767578125, -1.5539093017578125, -1.5101318359375, -1.4663543701171875, -1.422576904296875, -1.3787994384765625, -1.33502197265625, -1.2912445068359375, -1.247467041015625, -1.2036895751953125, -1.159912109375, -1.1161346435546875, -1.072357177734375, -1.0285797119140625, -0.98480224609375, -0.9410247802734375, -0.897247314453125, -0.8534698486328125, -0.8096923828125, -0.7659149169921875, -0.722137451171875, -0.6783599853515625, -0.63458251953125, -0.5908050537109375, -0.547027587890625, -0.5032501220703125, -0.45947265625, -0.4156951904296875, -0.371917724609375, -0.3281402587890625, -0.28436279296875, -0.2405853271484375, -0.196807861328125, -0.1530303955078125, -0.1092529296875, -0.0654754638671875, -0.021697998046875, 0.0220794677734375, 0.06585693359375, 0.1096343994140625, 0.153411865234375, 0.1971893310546875, 0.240966796875, 0.2847442626953125, 0.328521728515625, 0.3722991943359375, 0.41607666015625, 0.4598541259765625, 0.503631591796875, 0.5474090576171875, 0.5911865234375, 0.6349639892578125, 0.678741455078125, 0.7225189208984375, 0.76629638671875, 0.8100738525390625, 0.853851318359375, 0.8976287841796875, 0.94140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 21.0, 24.0, 36.0, 42.0, 74.0, 78.0, 62.0, 92.0, 116.0, 96.0, 90.0, 69.0, 44.0, 41.0, 29.0, 29.0, 14.0, 4.0, 11.0, 6.0, 0.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.103515625, -2.0527496337890625, -2.001983642578125, -1.9512176513671875, -1.90045166015625, -1.8496856689453125, -1.798919677734375, -1.7481536865234375, -1.6973876953125, -1.6466217041015625, -1.595855712890625, -1.5450897216796875, -1.49432373046875, -1.4435577392578125, -1.392791748046875, -1.3420257568359375, -1.291259765625, -1.2404937744140625, -1.189727783203125, -1.1389617919921875, -1.08819580078125, -1.0374298095703125, -0.986663818359375, -0.9358978271484375, -0.8851318359375, -0.8343658447265625, -0.783599853515625, -0.7328338623046875, -0.68206787109375, -0.6313018798828125, -0.580535888671875, -0.5297698974609375, -0.47900390625, -0.4282379150390625, -0.377471923828125, -0.3267059326171875, -0.27593994140625, -0.2251739501953125, -0.174407958984375, -0.1236419677734375, -0.0728759765625, -0.0221099853515625, 0.028656005859375, 0.0794219970703125, 0.13018798828125, 0.1809539794921875, 0.231719970703125, 0.2824859619140625, 0.333251953125, 0.3840179443359375, 0.434783935546875, 0.4855499267578125, 0.53631591796875, 0.5870819091796875, 0.637847900390625, 0.6886138916015625, 0.7393798828125, 0.7901458740234375, 0.840911865234375, 0.8916778564453125, 0.94244384765625, 0.9932098388671875, 1.043975830078125, 1.0947418212890625, 1.1455078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 10.0, 6.0, 21.0, 107.0, 242.0, 357.0, 193.0, 48.0, 11.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.57146453857422, -38.9788818359375, -37.38629913330078, -35.79371643066406, -34.201133728027344, -32.608551025390625, -31.01597023010254, -29.42338752746582, -27.8308048248291, -26.238222122192383, -24.645639419555664, -23.053058624267578, -21.46047592163086, -19.86789321899414, -18.275310516357422, -16.682727813720703, -15.090145111083984, -13.497562408447266, -11.904979705810547, -10.312397956848145, -8.719815254211426, -7.127232551574707, -5.534650802612305, -3.942068099975586, -2.349485397338867, -0.7569029331207275, 0.8356795310974121, 2.4282617568969727, 4.020844459533691, 5.61342716217041, 7.2060089111328125, 8.798591613769531, 10.391170501708984, 11.983753204345703, 13.576335906982422, 15.168917655944824, 16.76150131225586, 18.354084014892578, 19.946664810180664, 21.539247512817383, 23.1318302154541, 24.72441291809082, 26.31699562072754, 27.909576416015625, 29.502159118652344, 31.094741821289062, 32.68732452392578, 34.2799072265625, 35.87248992919922, 37.46507263183594, 39.057655334472656, 40.650238037109375, 42.242820739746094, 43.83540344238281, 45.42798614501953, 47.02056884765625, 48.61315155029297, 50.20573425292969, 51.798316955566406, 53.390899658203125, 54.983482360839844, 56.57606506347656, 58.16864776611328, 59.76123046875, 61.35380935668945]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 16.0, 13.0, 23.0, 35.0, 30.0, 30.0, 49.0, 74.0, 73.0, 71.0, 81.0, 77.0, 58.0, 63.0, 51.0, 44.0, 50.0, 30.0, 23.0, 16.0, 10.0, 12.0, 19.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.497474670410156, -23.804574966430664, -23.11167335510254, -22.418773651123047, -21.725872039794922, -21.03297233581543, -20.340072631835938, -19.647171020507812, -18.95427131652832, -18.261371612548828, -17.568470001220703, -16.87557029724121, -16.18267059326172, -15.489768981933594, -14.796869277954102, -14.103968620300293, -13.411067962646484, -12.718167304992676, -12.025266647338867, -11.332366943359375, -10.639466285705566, -9.946565628051758, -9.253665924072266, -8.560765266418457, -7.867864608764648, -7.17496395111084, -6.4820637702941895, -5.789163589477539, -5.0962629318237305, -4.403362274169922, -3.7104620933532715, -3.017561912536621, -2.3246631622314453, -1.6317627429962158, -0.9388623237609863, -0.24596190452575684, 0.44693851470947266, 1.1398389339447021, 1.8327393531799316, 2.525639533996582, 3.2185401916503906, 3.91144061088562, 4.60434103012085, 5.2972412109375, 5.990141868591309, 6.683042526245117, 7.375942707061768, 8.068842887878418, 8.761743545532227, 9.454644203186035, 10.147544860839844, 10.840444564819336, 11.533345222473145, 12.226245880126953, 12.919145584106445, 13.612046241760254, 14.304946899414062, 14.997847557067871, 15.69074821472168, 16.383647918701172, 17.076549530029297, 17.76944923400879, 18.46234893798828, 19.155250549316406, 19.8481502532959]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 9.0, 13.0, 13.0, 12.0, 15.0, 30.0, 24.0, 45.0, 77.0, 116.0, 222.0, 619.0, 4986.0, 170221.0, 3997475.0, 18003.0, 1497.0, 383.0, 170.0, 99.0, 71.0, 46.0, 32.0, 24.0, 19.0, 12.0, 14.0, 7.0, 8.0, 4.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.86016845703125, -5.6890869140625, -5.51800537109375, -5.346923828125, -5.17584228515625, -5.0047607421875, -4.83367919921875, -4.66259765625, -4.49151611328125, -4.3204345703125, -4.14935302734375, -3.978271484375, -3.80718994140625, -3.6361083984375, -3.46502685546875, -3.2939453125, -3.12286376953125, -2.9517822265625, -2.78070068359375, -2.609619140625, -2.43853759765625, -2.2674560546875, -2.09637451171875, -1.92529296875, -1.75421142578125, -1.5831298828125, -1.41204833984375, -1.240966796875, -1.06988525390625, -0.8988037109375, -0.72772216796875, -0.556640625, -0.38555908203125, -0.2144775390625, -0.04339599609375, 0.127685546875, 0.29876708984375, 0.4698486328125, 0.64093017578125, 0.81201171875, 0.98309326171875, 1.1541748046875, 1.32525634765625, 1.496337890625, 1.66741943359375, 1.8385009765625, 2.00958251953125, 2.1806640625, 2.35174560546875, 2.5228271484375, 2.69390869140625, 2.864990234375, 3.03607177734375, 3.2071533203125, 3.37823486328125, 3.54931640625, 3.72039794921875, 3.8914794921875, 4.06256103515625, 4.233642578125, 4.40472412109375, 4.5758056640625, 4.74688720703125, 4.91796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 12.0, 22.0, 42.0, 69.0, 99.0, 137.0, 125.0, 147.0, 116.0, 95.0, 55.0, 46.0, 20.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.280487060546875, -2.19573974609375, -2.110992431640625, -2.0262451171875, -1.941497802734375, -1.85675048828125, -1.772003173828125, -1.687255859375, -1.602508544921875, -1.51776123046875, -1.433013916015625, -1.3482666015625, -1.263519287109375, -1.17877197265625, -1.094024658203125, -1.00927734375, -0.924530029296875, -0.83978271484375, -0.755035400390625, -0.6702880859375, -0.585540771484375, -0.50079345703125, -0.416046142578125, -0.331298828125, -0.246551513671875, -0.16180419921875, -0.077056884765625, 0.0076904296875, 0.092437744140625, 0.17718505859375, 0.261932373046875, 0.3466796875, 0.431427001953125, 0.51617431640625, 0.600921630859375, 0.6856689453125, 0.770416259765625, 0.85516357421875, 0.939910888671875, 1.024658203125, 1.109405517578125, 1.19415283203125, 1.278900146484375, 1.3636474609375, 1.448394775390625, 1.53314208984375, 1.617889404296875, 1.70263671875, 1.787384033203125, 1.87213134765625, 1.956878662109375, 2.0416259765625, 2.126373291015625, 2.21112060546875, 2.295867919921875, 2.380615234375, 2.465362548828125, 2.55010986328125, 2.634857177734375, 2.7196044921875, 2.804351806640625, 2.88909912109375, 2.973846435546875, 3.05859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 2.0, 8.0, 3.0, 14.0, 10.0, 25.0, 36.0, 76.0, 155.0, 291.0, 691.0, 1528.0, 3573.0, 9308.0, 25867.0, 103746.0, 1586633.0, 2290769.0, 123967.0, 29106.0, 10393.0, 4275.0, 1946.0, 860.0, 427.0, 246.0, 122.0, 70.0, 35.0, 32.0, 22.0, 11.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.52734375, -1.468719482421875, -1.41009521484375, -1.351470947265625, -1.2928466796875, -1.234222412109375, -1.17559814453125, -1.116973876953125, -1.058349609375, -0.999725341796875, -0.94110107421875, -0.882476806640625, -0.8238525390625, -0.765228271484375, -0.70660400390625, -0.647979736328125, -0.58935546875, -0.530731201171875, -0.47210693359375, -0.413482666015625, -0.3548583984375, -0.296234130859375, -0.23760986328125, -0.178985595703125, -0.120361328125, -0.061737060546875, -0.00311279296875, 0.055511474609375, 0.1141357421875, 0.172760009765625, 0.23138427734375, 0.290008544921875, 0.3486328125, 0.407257080078125, 0.46588134765625, 0.524505615234375, 0.5831298828125, 0.641754150390625, 0.70037841796875, 0.759002685546875, 0.817626953125, 0.876251220703125, 0.93487548828125, 0.993499755859375, 1.0521240234375, 1.110748291015625, 1.16937255859375, 1.227996826171875, 1.28662109375, 1.345245361328125, 1.40386962890625, 1.462493896484375, 1.5211181640625, 1.579742431640625, 1.63836669921875, 1.696990966796875, 1.755615234375, 1.814239501953125, 1.87286376953125, 1.931488037109375, 1.9901123046875, 2.048736572265625, 2.10736083984375, 2.165985107421875, 2.224609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 7.0, 6.0, 17.0, 16.0, 32.0, 30.0, 56.0, 80.0, 121.0, 237.0, 401.0, 725.0, 868.0, 592.0, 308.0, 182.0, 104.0, 73.0, 43.0, 35.0, 21.0, 19.0, 9.0, 11.0, 5.0, 9.0, 4.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.376953125, -1.318084716796875, -1.25921630859375, -1.200347900390625, -1.1414794921875, -1.082611083984375, -1.02374267578125, -0.964874267578125, -0.906005859375, -0.847137451171875, -0.78826904296875, -0.729400634765625, -0.6705322265625, -0.611663818359375, -0.55279541015625, -0.493927001953125, -0.43505859375, -0.376190185546875, -0.31732177734375, -0.258453369140625, -0.1995849609375, -0.140716552734375, -0.08184814453125, -0.022979736328125, 0.035888671875, 0.094757080078125, 0.15362548828125, 0.212493896484375, 0.2713623046875, 0.330230712890625, 0.38909912109375, 0.447967529296875, 0.5068359375, 0.565704345703125, 0.62457275390625, 0.683441162109375, 0.7423095703125, 0.801177978515625, 0.86004638671875, 0.918914794921875, 0.977783203125, 1.036651611328125, 1.09552001953125, 1.154388427734375, 1.2132568359375, 1.272125244140625, 1.33099365234375, 1.389862060546875, 1.44873046875, 1.507598876953125, 1.56646728515625, 1.625335693359375, 1.6842041015625, 1.743072509765625, 1.80194091796875, 1.860809326171875, 1.919677734375, 1.978546142578125, 2.03741455078125, 2.096282958984375, 2.1551513671875, 2.214019775390625, 2.27288818359375, 2.331756591796875, 2.390625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 8.0, 4.0, 7.0, 17.0, 55.0, 126.0, 255.0, 266.0, 154.0, 63.0, 29.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.99540328979492, -39.19813537597656, -38.40087127685547, -37.60360336303711, -36.80633544921875, -36.00906753540039, -35.2118034362793, -34.41453552246094, -33.61726760864258, -32.81999969482422, -32.022735595703125, -31.225467681884766, -30.428199768066406, -29.63093376159668, -28.833667755126953, -28.036399841308594, -27.239133834838867, -26.44186782836914, -25.64459991455078, -24.847333908081055, -24.050065994262695, -23.25279998779297, -22.45553207397461, -21.658266067504883, -20.861000061035156, -20.06373405456543, -19.26646614074707, -18.469200134277344, -17.671932220458984, -16.874666213989258, -16.07740020751953, -15.280132293701172, -14.482866287231445, -13.685599327087402, -12.88833236694336, -12.091066360473633, -11.293798446655273, -10.496532440185547, -9.699265480041504, -8.901998519897461, -8.104731559753418, -7.307464599609375, -6.510197639465332, -5.712931156158447, -4.915664196014404, -4.118397235870361, -3.3211307525634766, -2.5238637924194336, -1.7265968322753906, -0.9293299913406372, -0.1320631504058838, 0.6652035713195801, 1.462470531463623, 2.259737491607666, 3.057003974914551, 3.8542709350585938, 4.651537895202637, 5.44880485534668, 6.246071815490723, 7.043338298797607, 7.84060525894165, 8.637872695922852, 9.435138702392578, 10.232405662536621, 11.029672622680664]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 6.0, 19.0, 11.0, 22.0, 23.0, 24.0, 30.0, 34.0, 46.0, 47.0, 49.0, 55.0, 49.0, 59.0, 55.0, 58.0, 52.0, 37.0, 35.0, 39.0, 28.0, 43.0, 33.0, 23.0, 21.0, 21.0, 20.0, 7.0, 4.0, 8.0, 1.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.039276123046875, -10.732244491577148, -10.425213813781738, -10.118182182312012, -9.811151504516602, -9.504119873046875, -9.197089195251465, -8.890057563781738, -8.583026885986328, -8.275995254516602, -7.968964576721191, -7.661933422088623, -7.354902267456055, -7.047871112823486, -6.740839958190918, -6.433808326721191, -6.126777172088623, -5.819746017456055, -5.512714862823486, -5.205683708190918, -4.89865255355835, -4.591621398925781, -4.284589767456055, -3.9775588512420654, -3.670527696609497, -3.3634965419769287, -3.0564653873443604, -2.749433994293213, -2.4424028396606445, -2.135371685028076, -1.8283405303955078, -1.5213093757629395, -1.214278221130371, -0.9072470664978027, -0.6002158522605896, -0.29318463802337646, 0.013846516609191895, 0.32087767124176025, 0.6279089450836182, 0.9349400997161865, 1.2419712543487549, 1.5490024089813232, 1.8560335636138916, 2.163064956665039, 2.4700961112976074, 2.777127265930176, 3.084158420562744, 3.3911895751953125, 3.698220729827881, 4.005251884460449, 4.312283039093018, 4.619314193725586, 4.926345348358154, 5.233376502990723, 5.540408134460449, 5.847438812255859, 6.154470443725586, 6.461501598358154, 6.768532752990723, 7.075563907623291, 7.382595062255859, 7.689626216888428, 7.996657371520996, 8.303689002990723, 8.610719680786133]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 9.0, 10.0, 5.0, 9.0, 22.0, 28.0, 45.0, 83.0, 127.0, 222.0, 370.0, 760.0, 1398.0, 3137.0, 7238.0, 18420.0, 50847.0, 153870.0, 381970.0, 280231.0, 95131.0, 32760.0, 12184.0, 5114.0, 2258.0, 1047.0, 560.0, 270.0, 152.0, 112.0, 64.0, 35.0, 26.0, 12.0, 14.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.91900634765625, -1.8604736328125, -1.80194091796875, -1.743408203125, -1.68487548828125, -1.6263427734375, -1.56781005859375, -1.50927734375, -1.45074462890625, -1.3922119140625, -1.33367919921875, -1.275146484375, -1.21661376953125, -1.1580810546875, -1.09954833984375, -1.041015625, -0.98248291015625, -0.9239501953125, -0.86541748046875, -0.806884765625, -0.74835205078125, -0.6898193359375, -0.63128662109375, -0.57275390625, -0.51422119140625, -0.4556884765625, -0.39715576171875, -0.338623046875, -0.28009033203125, -0.2215576171875, -0.16302490234375, -0.1044921875, -0.04595947265625, 0.0125732421875, 0.07110595703125, 0.129638671875, 0.18817138671875, 0.2467041015625, 0.30523681640625, 0.36376953125, 0.42230224609375, 0.4808349609375, 0.53936767578125, 0.597900390625, 0.65643310546875, 0.7149658203125, 0.77349853515625, 0.83203125, 0.89056396484375, 0.9490966796875, 1.00762939453125, 1.066162109375, 1.12469482421875, 1.1832275390625, 1.24176025390625, 1.30029296875, 1.35882568359375, 1.4173583984375, 1.47589111328125, 1.534423828125, 1.59295654296875, 1.6514892578125, 1.71002197265625, 1.7685546875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 8.0, 10.0, 17.0, 22.0, 33.0, 42.0, 48.0, 61.0, 67.0, 78.0, 113.0, 80.0, 86.0, 82.0, 67.0, 44.0, 50.0, 31.0, 19.0, 15.0, 7.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.779296875, -1.7284393310546875, -1.677581787109375, -1.6267242431640625, -1.57586669921875, -1.5250091552734375, -1.474151611328125, -1.4232940673828125, -1.3724365234375, -1.3215789794921875, -1.270721435546875, -1.2198638916015625, -1.16900634765625, -1.1181488037109375, -1.067291259765625, -1.0164337158203125, -0.965576171875, -0.9147186279296875, -0.863861083984375, -0.8130035400390625, -0.76214599609375, -0.7112884521484375, -0.660430908203125, -0.6095733642578125, -0.5587158203125, -0.5078582763671875, -0.457000732421875, -0.4061431884765625, -0.35528564453125, -0.3044281005859375, -0.253570556640625, -0.2027130126953125, -0.15185546875, -0.1009979248046875, -0.050140380859375, 0.0007171630859375, 0.05157470703125, 0.1024322509765625, 0.153289794921875, 0.2041473388671875, 0.2550048828125, 0.3058624267578125, 0.356719970703125, 0.4075775146484375, 0.45843505859375, 0.5092926025390625, 0.560150146484375, 0.6110076904296875, 0.661865234375, 0.7127227783203125, 0.763580322265625, 0.8144378662109375, 0.86529541015625, 0.9161529541015625, 0.967010498046875, 1.0178680419921875, 1.0687255859375, 1.1195831298828125, 1.170440673828125, 1.2212982177734375, 1.27215576171875, 1.3230133056640625, 1.373870849609375, 1.4247283935546875, 1.4755859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 11.0, 13.0, 18.0, 17.0, 30.0, 59.0, 61.0, 94.0, 143.0, 201.0, 399.0, 703.0, 1519.0, 4191.0, 15835.0, 88121.0, 595014.0, 285102.0, 42752.0, 9047.0, 2773.0, 1107.0, 547.0, 290.0, 179.0, 104.0, 63.0, 47.0, 29.0, 21.0, 8.0, 8.0, 6.0, 7.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-2.93359375, -2.841339111328125, -2.74908447265625, -2.656829833984375, -2.5645751953125, -2.472320556640625, -2.38006591796875, -2.287811279296875, -2.195556640625, -2.103302001953125, -2.01104736328125, -1.918792724609375, -1.8265380859375, -1.734283447265625, -1.64202880859375, -1.549774169921875, -1.45751953125, -1.365264892578125, -1.27301025390625, -1.180755615234375, -1.0885009765625, -0.996246337890625, -0.90399169921875, -0.811737060546875, -0.719482421875, -0.627227783203125, -0.53497314453125, -0.442718505859375, -0.3504638671875, -0.258209228515625, -0.16595458984375, -0.073699951171875, 0.0185546875, 0.110809326171875, 0.20306396484375, 0.295318603515625, 0.3875732421875, 0.479827880859375, 0.57208251953125, 0.664337158203125, 0.756591796875, 0.848846435546875, 0.94110107421875, 1.033355712890625, 1.1256103515625, 1.217864990234375, 1.31011962890625, 1.402374267578125, 1.49462890625, 1.586883544921875, 1.67913818359375, 1.771392822265625, 1.8636474609375, 1.955902099609375, 2.04815673828125, 2.140411376953125, 2.232666015625, 2.324920654296875, 2.41717529296875, 2.509429931640625, 2.6016845703125, 2.693939208984375, 2.78619384765625, 2.878448486328125, 2.970703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 0.0, 8.0, 5.0, 14.0, 6.0, 13.0, 12.0, 14.0, 16.0, 20.0, 25.0, 27.0, 26.0, 39.0, 39.0, 33.0, 53.0, 61.0, 43.0, 54.0, 47.0, 60.0, 50.0, 41.0, 50.0, 32.0, 25.0, 31.0, 33.0, 17.0, 13.0, 13.0, 16.0, 14.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.3446044921875, -3.238037109375, -3.1314697265625, -3.02490234375, -2.9183349609375, -2.811767578125, -2.7052001953125, -2.5986328125, -2.4920654296875, -2.385498046875, -2.2789306640625, -2.17236328125, -2.0657958984375, -1.959228515625, -1.8526611328125, -1.74609375, -1.6395263671875, -1.532958984375, -1.4263916015625, -1.31982421875, -1.2132568359375, -1.106689453125, -1.0001220703125, -0.8935546875, -0.7869873046875, -0.680419921875, -0.5738525390625, -0.46728515625, -0.3607177734375, -0.254150390625, -0.1475830078125, -0.041015625, 0.0655517578125, 0.172119140625, 0.2786865234375, 0.38525390625, 0.4918212890625, 0.598388671875, 0.7049560546875, 0.8115234375, 0.9180908203125, 1.024658203125, 1.1312255859375, 1.23779296875, 1.3443603515625, 1.450927734375, 1.5574951171875, 1.6640625, 1.7706298828125, 1.877197265625, 1.9837646484375, 2.09033203125, 2.1968994140625, 2.303466796875, 2.4100341796875, 2.5166015625, 2.6231689453125, 2.729736328125, 2.8363037109375, 2.94287109375, 3.0494384765625, 3.156005859375, 3.2625732421875, 3.369140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 15.0, 25.0, 30.0, 93.0, 242.0, 1038.0, 11156.0, 936631.0, 96247.0, 2386.0, 430.0, 132.0, 47.0, 37.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.677734375, -1.588165283203125, -1.49859619140625, -1.409027099609375, -1.3194580078125, -1.229888916015625, -1.14031982421875, -1.050750732421875, -0.961181640625, -0.871612548828125, -0.78204345703125, -0.692474365234375, -0.6029052734375, -0.513336181640625, -0.42376708984375, -0.334197998046875, -0.24462890625, -0.155059814453125, -0.06549072265625, 0.024078369140625, 0.1136474609375, 0.203216552734375, 0.29278564453125, 0.382354736328125, 0.471923828125, 0.561492919921875, 0.65106201171875, 0.740631103515625, 0.8302001953125, 0.919769287109375, 1.00933837890625, 1.098907470703125, 1.1884765625, 1.278045654296875, 1.36761474609375, 1.457183837890625, 1.5467529296875, 1.636322021484375, 1.72589111328125, 1.815460205078125, 1.905029296875, 1.994598388671875, 2.08416748046875, 2.173736572265625, 2.2633056640625, 2.352874755859375, 2.44244384765625, 2.532012939453125, 2.62158203125, 2.711151123046875, 2.80072021484375, 2.890289306640625, 2.9798583984375, 3.069427490234375, 3.15899658203125, 3.248565673828125, 3.338134765625, 3.427703857421875, 3.51727294921875, 3.606842041015625, 3.6964111328125, 3.785980224609375, 3.87554931640625, 3.965118408203125, 4.0546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 14.0, 12.0, 14.0, 17.0, 35.0, 35.0, 46.0, 55.0, 48.0, 59.0, 56.0, 89.0, 60.0, 68.0, 57.0, 52.0, 40.0, 42.0, 24.0, 27.0, 21.0, 19.0, 12.0, 11.0, 11.0, 9.0, 8.0, 4.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001404285430908203, -0.00013588741421699524, -0.00013134628534317017, -0.0001268051564693451, -0.00012226402759552002, -0.00011772289872169495, -0.00011318176984786987, -0.0001086406409740448, -0.00010409951210021973, -9.955838322639465e-05, -9.501725435256958e-05, -9.047612547874451e-05, -8.593499660491943e-05, -8.139386773109436e-05, -7.685273885726929e-05, -7.231160998344421e-05, -6.777048110961914e-05, -6.322935223579407e-05, -5.8688223361968994e-05, -5.414709448814392e-05, -4.960596561431885e-05, -4.5064836740493774e-05, -4.05237078666687e-05, -3.598257899284363e-05, -3.1441450119018555e-05, -2.690032124519348e-05, -2.2359192371368408e-05, -1.7818063497543335e-05, -1.3276934623718262e-05, -8.735805749893188e-06, -4.194676876068115e-06, 3.46451997756958e-07, 4.887580871582031e-06, 9.428709745407104e-06, 1.3969838619232178e-05, 1.851096749305725e-05, 2.3052096366882324e-05, 2.7593225240707397e-05, 3.213435411453247e-05, 3.6675482988357544e-05, 4.121661186218262e-05, 4.575774073600769e-05, 5.0298869609832764e-05, 5.483999848365784e-05, 5.938112735748291e-05, 6.392225623130798e-05, 6.846338510513306e-05, 7.300451397895813e-05, 7.75456428527832e-05, 8.208677172660828e-05, 8.662790060043335e-05, 9.116902947425842e-05, 9.57101583480835e-05, 0.00010025128722190857, 0.00010479241609573364, 0.00010933354496955872, 0.00011387467384338379, 0.00011841580271720886, 0.00012295693159103394, 0.000127498060464859, 0.00013203918933868408, 0.00013658031821250916, 0.00014112144708633423, 0.0001456625759601593, 0.00015020370483398438]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 13.0, 21.0, 41.0, 51.0, 71.0, 157.0, 271.0, 621.0, 1441.0, 4864.0, 34892.0, 689701.0, 294675.0, 16544.0, 3118.0, 1022.0, 467.0, 227.0, 114.0, 80.0, 49.0, 40.0, 20.0, 10.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.560546875, -1.5157623291015625, -1.470977783203125, -1.4261932373046875, -1.38140869140625, -1.3366241455078125, -1.291839599609375, -1.2470550537109375, -1.2022705078125, -1.1574859619140625, -1.112701416015625, -1.0679168701171875, -1.02313232421875, -0.9783477783203125, -0.933563232421875, -0.8887786865234375, -0.843994140625, -0.7992095947265625, -0.754425048828125, -0.7096405029296875, -0.66485595703125, -0.6200714111328125, -0.575286865234375, -0.5305023193359375, -0.4857177734375, -0.4409332275390625, -0.396148681640625, -0.3513641357421875, -0.30657958984375, -0.2617950439453125, -0.217010498046875, -0.1722259521484375, -0.12744140625, -0.0826568603515625, -0.037872314453125, 0.0069122314453125, 0.05169677734375, 0.0964813232421875, 0.141265869140625, 0.1860504150390625, 0.2308349609375, 0.2756195068359375, 0.320404052734375, 0.3651885986328125, 0.40997314453125, 0.4547576904296875, 0.499542236328125, 0.5443267822265625, 0.589111328125, 0.6338958740234375, 0.678680419921875, 0.7234649658203125, 0.76824951171875, 0.8130340576171875, 0.857818603515625, 0.9026031494140625, 0.9473876953125, 0.9921722412109375, 1.036956787109375, 1.0817413330078125, 1.12652587890625, 1.1713104248046875, 1.216094970703125, 1.2608795166015625, 1.3056640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 15.0, 33.0, 33.0, 60.0, 81.0, 81.0, 118.0, 126.0, 113.0, 104.0, 80.0, 57.0, 35.0, 21.0, 14.0, 8.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.17578125, -1.129730224609375, -1.08367919921875, -1.037628173828125, -0.9915771484375, -0.945526123046875, -0.89947509765625, -0.853424072265625, -0.807373046875, -0.761322021484375, -0.71527099609375, -0.669219970703125, -0.6231689453125, -0.577117919921875, -0.53106689453125, -0.485015869140625, -0.43896484375, -0.392913818359375, -0.34686279296875, -0.300811767578125, -0.2547607421875, -0.208709716796875, -0.16265869140625, -0.116607666015625, -0.070556640625, -0.024505615234375, 0.02154541015625, 0.067596435546875, 0.1136474609375, 0.159698486328125, 0.20574951171875, 0.251800537109375, 0.2978515625, 0.343902587890625, 0.38995361328125, 0.436004638671875, 0.4820556640625, 0.528106689453125, 0.57415771484375, 0.620208740234375, 0.666259765625, 0.712310791015625, 0.75836181640625, 0.804412841796875, 0.8504638671875, 0.896514892578125, 0.94256591796875, 0.988616943359375, 1.03466796875, 1.080718994140625, 1.12677001953125, 1.172821044921875, 1.2188720703125, 1.264923095703125, 1.31097412109375, 1.357025146484375, 1.403076171875, 1.449127197265625, 1.49517822265625, 1.541229248046875, 1.5872802734375, 1.633331298828125, 1.67938232421875, 1.725433349609375, 1.771484375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 22.0, 65.0, 94.0, 209.0, 289.0, 167.0, 99.0, 26.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-44.257118225097656, -43.23796463012695, -42.218814849853516, -41.19966125488281, -40.180511474609375, -39.16135787963867, -38.14220428466797, -37.12305450439453, -36.10390090942383, -35.084747314453125, -34.06559753417969, -33.046443939208984, -32.02729034423828, -31.008140563964844, -29.98898696899414, -28.96983528137207, -27.95068359375, -26.93153190612793, -25.91238021850586, -24.893226623535156, -23.874074935913086, -22.854923248291016, -21.835769653320312, -20.816617965698242, -19.797466278076172, -18.7783145904541, -17.75916290283203, -16.740009307861328, -15.720857620239258, -14.701705932617188, -13.6825532913208, -12.663400650024414, -11.644245147705078, -10.625093460083008, -9.605940818786621, -8.586788177490234, -7.567636489868164, -6.5484843254089355, -5.529332160949707, -4.5101799964904785, -3.49102783203125, -2.4718756675720215, -1.452723503112793, -0.43357133865356445, 0.5855808258056641, 1.6047329902648926, 2.623885154724121, 3.6430373191833496, 4.662189483642578, 5.681341648101807, 6.700493812561035, 7.719645977020264, 8.738798141479492, 9.757949829101562, 10.77710247039795, 11.796255111694336, 12.815406799316406, 13.834558486938477, 14.853711128234863, 15.87286376953125, 16.89201545715332, 17.91116714477539, 18.930320739746094, 19.949472427368164, 20.968624114990234]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 16.0, 27.0, 27.0, 27.0, 39.0, 60.0, 61.0, 62.0, 69.0, 96.0, 99.0, 65.0, 61.0, 52.0, 52.0, 35.0, 45.0, 35.0, 13.0, 21.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.88585662841797, -20.139802932739258, -19.393747329711914, -18.647693634033203, -17.90163803100586, -17.15558433532715, -16.409530639648438, -15.66347599029541, -14.917421340942383, -14.171366691589355, -13.425312042236328, -12.679258346557617, -11.93320369720459, -11.187149047851562, -10.441095352172852, -9.695040702819824, -8.948986053466797, -8.20293140411377, -7.4568772315979, -6.710823059082031, -5.964768409729004, -5.218713760375977, -4.472659587860107, -3.7266054153442383, -2.980550765991211, -2.2344963550567627, -1.4884419441223145, -0.7423875331878662, 0.0036668777465820312, 0.7497212886810303, 1.4957756996154785, 2.2418298721313477, 2.987882614135742, 3.7339370250701904, 4.479991436004639, 5.226045608520508, 5.972100257873535, 6.7181549072265625, 7.464209079742432, 8.2102632522583, 8.956317901611328, 9.702372550964355, 10.448427200317383, 11.194480895996094, 11.940535545349121, 12.686590194702148, 13.43264389038086, 14.178698539733887, 14.924753189086914, 15.670807838439941, 16.41686248779297, 17.16291618347168, 17.90896987915039, 18.655025482177734, 19.401079177856445, 20.147132873535156, 20.8931884765625, 21.63924217224121, 22.385297775268555, 23.131351470947266, 23.87740707397461, 24.62346076965332, 25.36951446533203, 26.115570068359375, 26.861623764038086]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 10.0, 19.0, 31.0, 48.0, 80.0, 130.0, 252.0, 559.0, 1200.0, 3149.0, 10871.0, 55866.0, 743970.0, 3059850.0, 278162.0, 29675.0, 6513.0, 2050.0, 863.0, 432.0, 210.0, 118.0, 81.0, 42.0, 30.0, 22.0, 10.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.25506591796875, -1.2034912109375, -1.15191650390625, -1.100341796875, -1.04876708984375, -0.9971923828125, -0.94561767578125, -0.89404296875, -0.84246826171875, -0.7908935546875, -0.73931884765625, -0.687744140625, -0.63616943359375, -0.5845947265625, -0.53302001953125, -0.4814453125, -0.42987060546875, -0.3782958984375, -0.32672119140625, -0.275146484375, -0.22357177734375, -0.1719970703125, -0.12042236328125, -0.06884765625, -0.01727294921875, 0.0343017578125, 0.08587646484375, 0.137451171875, 0.18902587890625, 0.2406005859375, 0.29217529296875, 0.34375, 0.39532470703125, 0.4468994140625, 0.49847412109375, 0.550048828125, 0.60162353515625, 0.6531982421875, 0.70477294921875, 0.75634765625, 0.80792236328125, 0.8594970703125, 0.91107177734375, 0.962646484375, 1.01422119140625, 1.0657958984375, 1.11737060546875, 1.1689453125, 1.22052001953125, 1.2720947265625, 1.32366943359375, 1.375244140625, 1.42681884765625, 1.4783935546875, 1.52996826171875, 1.58154296875, 1.63311767578125, 1.6846923828125, 1.73626708984375, 1.787841796875, 1.83941650390625, 1.8909912109375, 1.94256591796875, 1.994140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 4.0, 9.0, 16.0, 20.0, 29.0, 37.0, 46.0, 52.0, 54.0, 59.0, 83.0, 80.0, 78.0, 73.0, 67.0, 67.0, 55.0, 48.0, 35.0, 19.0, 23.0, 11.0, 12.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99365234375, -0.9523696899414062, -0.9110870361328125, -0.8698043823242188, -0.828521728515625, -0.7872390747070312, -0.7459564208984375, -0.7046737670898438, -0.66339111328125, -0.6221084594726562, -0.5808258056640625, -0.5395431518554688, -0.498260498046875, -0.45697784423828125, -0.4156951904296875, -0.37441253662109375, -0.3331298828125, -0.29184722900390625, -0.2505645751953125, -0.20928192138671875, -0.167999267578125, -0.12671661376953125, -0.0854339599609375, -0.04415130615234375, -0.00286865234375, 0.03841400146484375, 0.0796966552734375, 0.12097930908203125, 0.162261962890625, 0.20354461669921875, 0.2448272705078125, 0.28610992431640625, 0.327392578125, 0.36867523193359375, 0.4099578857421875, 0.45124053955078125, 0.492523193359375, 0.5338058471679688, 0.5750885009765625, 0.6163711547851562, 0.65765380859375, 0.6989364624023438, 0.7402191162109375, 0.7815017700195312, 0.822784423828125, 0.8640670776367188, 0.9053497314453125, 0.9466323852539062, 0.9879150390625, 1.0291976928710938, 1.0704803466796875, 1.1117630004882812, 1.153045654296875, 1.1943283081054688, 1.2356109619140625, 1.2768936157226562, 1.31817626953125, 1.3594589233398438, 1.4007415771484375, 1.4420242309570312, 1.483306884765625, 1.5245895385742188, 1.5658721923828125, 1.6071548461914062, 1.6484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 8.0, 15.0, 22.0, 25.0, 38.0, 42.0, 73.0, 124.0, 243.0, 464.0, 999.0, 2495.0, 7320.0, 30758.0, 253667.0, 3533940.0, 319314.0, 32899.0, 7294.0, 2398.0, 979.0, 512.0, 246.0, 150.0, 76.0, 64.0, 28.0, 14.0, 18.0, 14.0, 9.0, 5.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.232421875, -2.159332275390625, -2.08624267578125, -2.013153076171875, -1.9400634765625, -1.866973876953125, -1.79388427734375, -1.720794677734375, -1.647705078125, -1.574615478515625, -1.50152587890625, -1.428436279296875, -1.3553466796875, -1.282257080078125, -1.20916748046875, -1.136077880859375, -1.06298828125, -0.989898681640625, -0.91680908203125, -0.843719482421875, -0.7706298828125, -0.697540283203125, -0.62445068359375, -0.551361083984375, -0.478271484375, -0.405181884765625, -0.33209228515625, -0.259002685546875, -0.1859130859375, -0.112823486328125, -0.03973388671875, 0.033355712890625, 0.1064453125, 0.179534912109375, 0.25262451171875, 0.325714111328125, 0.3988037109375, 0.471893310546875, 0.54498291015625, 0.618072509765625, 0.691162109375, 0.764251708984375, 0.83734130859375, 0.910430908203125, 0.9835205078125, 1.056610107421875, 1.12969970703125, 1.202789306640625, 1.27587890625, 1.348968505859375, 1.42205810546875, 1.495147705078125, 1.5682373046875, 1.641326904296875, 1.71441650390625, 1.787506103515625, 1.860595703125, 1.933685302734375, 2.00677490234375, 2.079864501953125, 2.1529541015625, 2.226043701171875, 2.29913330078125, 2.372222900390625, 2.4453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 7.0, 5.0, 13.0, 25.0, 23.0, 43.0, 59.0, 100.0, 164.0, 315.0, 711.0, 1014.0, 737.0, 376.0, 178.0, 110.0, 69.0, 40.0, 26.0, 12.0, 9.0, 3.0, 5.0, 3.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.189453125, -3.09735107421875, -3.0052490234375, -2.91314697265625, -2.821044921875, -2.72894287109375, -2.6368408203125, -2.54473876953125, -2.45263671875, -2.36053466796875, -2.2684326171875, -2.17633056640625, -2.084228515625, -1.99212646484375, -1.9000244140625, -1.80792236328125, -1.7158203125, -1.62371826171875, -1.5316162109375, -1.43951416015625, -1.347412109375, -1.25531005859375, -1.1632080078125, -1.07110595703125, -0.97900390625, -0.88690185546875, -0.7947998046875, -0.70269775390625, -0.610595703125, -0.51849365234375, -0.4263916015625, -0.33428955078125, -0.2421875, -0.15008544921875, -0.0579833984375, 0.03411865234375, 0.126220703125, 0.21832275390625, 0.3104248046875, 0.40252685546875, 0.49462890625, 0.58673095703125, 0.6788330078125, 0.77093505859375, 0.863037109375, 0.95513916015625, 1.0472412109375, 1.13934326171875, 1.2314453125, 1.32354736328125, 1.4156494140625, 1.50775146484375, 1.599853515625, 1.69195556640625, 1.7840576171875, 1.87615966796875, 1.96826171875, 2.06036376953125, 2.1524658203125, 2.24456787109375, 2.336669921875, 2.42877197265625, 2.5208740234375, 2.61297607421875, 2.705078125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 22.0, 33.0, 109.0, 202.0, 257.0, 173.0, 105.0, 37.0, 15.0, 5.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.569122314453125, -23.75977325439453, -22.950424194335938, -22.141075134277344, -21.33172607421875, -20.522377014160156, -19.71302604675293, -18.903676986694336, -18.094327926635742, -17.28497886657715, -16.475629806518555, -15.666279792785645, -14.85693073272705, -14.047581672668457, -13.238231658935547, -12.428882598876953, -11.61953353881836, -10.810184478759766, -10.000835418701172, -9.191485404968262, -8.382136344909668, -7.572787284851074, -6.763437747955322, -5.95408821105957, -5.144739151000977, -4.335390090942383, -3.526040554046631, -2.716691255569458, -1.9073419570922852, -1.0979928970336914, -0.28864336013793945, 0.5207061767578125, 1.330057144165039, 2.139406442642212, 2.9487557411193848, 3.7581050395965576, 4.5674543380737305, 5.376803398132324, 6.186152935028076, 6.995502471923828, 7.804851531982422, 8.614200592041016, 9.42354965209961, 10.23289966583252, 11.042248725891113, 11.851597785949707, 12.660947799682617, 13.470296859741211, 14.279645919799805, 15.088994979858398, 15.898344039916992, 16.707693099975586, 17.517044067382812, 18.326393127441406, 19.1357421875, 19.945091247558594, 20.754440307617188, 21.56378936767578, 22.373138427734375, 23.18248748779297, 23.991836547851562, 24.801185607910156, 25.610536575317383, 26.419885635375977, 27.22923469543457]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 14.0, 15.0, 28.0, 20.0, 32.0, 26.0, 28.0, 37.0, 38.0, 40.0, 48.0, 43.0, 38.0, 51.0, 49.0, 45.0, 48.0, 39.0, 36.0, 35.0, 29.0, 27.0, 36.0, 26.0, 19.0, 15.0, 15.0, 10.0, 7.0, 6.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.81758975982666, -10.494715690612793, -10.17184066772461, -9.848966598510742, -9.526092529296875, -9.203218460083008, -8.880343437194824, -8.557469367980957, -8.23459529876709, -7.9117207527160645, -7.588846683502197, -7.265972137451172, -6.943098068237305, -6.620223522186279, -6.297348976135254, -5.974474906921387, -5.651600360870361, -5.328725814819336, -5.005851745605469, -4.682977199554443, -4.360103130340576, -4.037228584289551, -3.7143542766571045, -3.391479969024658, -3.068605661392212, -2.7457313537597656, -2.4228570461273193, -2.099982738494873, -1.7771083116531372, -1.454234004020691, -1.131359577178955, -0.8084852695465088, -0.4856109619140625, -0.16273662447929382, 0.16013771295547485, 0.4830120801925659, 0.8058863878250122, 1.1287606954574585, 1.4516351222991943, 1.7745094299316406, 2.097383737564087, 2.420258045196533, 2.7431323528289795, 3.066006660461426, 3.388881206512451, 3.7117552757263184, 4.034629821777344, 4.357503890991211, 4.680378437042236, 5.003252983093262, 5.326127052307129, 5.649001598358154, 5.9718756675720215, 6.294750213623047, 6.617624282836914, 6.9404988288879395, 7.263373374938965, 7.58624792098999, 7.909121990203857, 8.231996536254883, 8.55487060546875, 8.877744674682617, 9.2006196975708, 9.523493766784668, 9.846367835998535]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 11.0, 12.0, 19.0, 26.0, 65.0, 90.0, 165.0, 246.0, 422.0, 742.0, 1656.0, 3257.0, 7405.0, 17309.0, 42954.0, 106416.0, 234440.0, 311552.0, 185660.0, 80064.0, 31923.0, 13000.0, 5614.0, 2630.0, 1261.0, 695.0, 371.0, 208.0, 134.0, 64.0, 57.0, 34.0, 17.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3076171875, -1.267181396484375, -1.22674560546875, -1.186309814453125, -1.1458740234375, -1.105438232421875, -1.06500244140625, -1.024566650390625, -0.984130859375, -0.943695068359375, -0.90325927734375, -0.862823486328125, -0.8223876953125, -0.781951904296875, -0.74151611328125, -0.701080322265625, -0.66064453125, -0.620208740234375, -0.57977294921875, -0.539337158203125, -0.4989013671875, -0.458465576171875, -0.41802978515625, -0.377593994140625, -0.337158203125, -0.296722412109375, -0.25628662109375, -0.215850830078125, -0.1754150390625, -0.134979248046875, -0.09454345703125, -0.054107666015625, -0.013671875, 0.026763916015625, 0.06719970703125, 0.107635498046875, 0.1480712890625, 0.188507080078125, 0.22894287109375, 0.269378662109375, 0.309814453125, 0.350250244140625, 0.39068603515625, 0.431121826171875, 0.4715576171875, 0.511993408203125, 0.55242919921875, 0.592864990234375, 0.63330078125, 0.673736572265625, 0.71417236328125, 0.754608154296875, 0.7950439453125, 0.835479736328125, 0.87591552734375, 0.916351318359375, 0.956787109375, 0.997222900390625, 1.03765869140625, 1.078094482421875, 1.1185302734375, 1.158966064453125, 1.19940185546875, 1.239837646484375, 1.2802734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 10.0, 14.0, 13.0, 19.0, 32.0, 21.0, 55.0, 39.0, 42.0, 54.0, 49.0, 58.0, 61.0, 67.0, 55.0, 51.0, 55.0, 45.0, 35.0, 35.0, 30.0, 32.0, 22.0, 19.0, 12.0, 16.0, 7.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0615234375, -1.0304412841796875, -0.999359130859375, -0.9682769775390625, -0.93719482421875, -0.9061126708984375, -0.875030517578125, -0.8439483642578125, -0.8128662109375, -0.7817840576171875, -0.750701904296875, -0.7196197509765625, -0.68853759765625, -0.6574554443359375, -0.626373291015625, -0.5952911376953125, -0.564208984375, -0.5331268310546875, -0.502044677734375, -0.4709625244140625, -0.43988037109375, -0.4087982177734375, -0.377716064453125, -0.3466339111328125, -0.3155517578125, -0.2844696044921875, -0.253387451171875, -0.2223052978515625, -0.19122314453125, -0.1601409912109375, -0.129058837890625, -0.0979766845703125, -0.06689453125, -0.0358123779296875, -0.004730224609375, 0.0263519287109375, 0.05743408203125, 0.0885162353515625, 0.119598388671875, 0.1506805419921875, 0.1817626953125, 0.2128448486328125, 0.243927001953125, 0.2750091552734375, 0.30609130859375, 0.3371734619140625, 0.368255615234375, 0.3993377685546875, 0.430419921875, 0.4615020751953125, 0.492584228515625, 0.5236663818359375, 0.55474853515625, 0.5858306884765625, 0.616912841796875, 0.6479949951171875, 0.6790771484375, 0.7101593017578125, 0.741241455078125, 0.7723236083984375, 0.80340576171875, 0.8344879150390625, 0.865570068359375, 0.8966522216796875, 0.927734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 14.0, 14.0, 24.0, 37.0, 40.0, 59.0, 106.0, 128.0, 183.0, 263.0, 377.0, 586.0, 1020.0, 2016.0, 5548.0, 26407.0, 253199.0, 672252.0, 69672.0, 10071.0, 2979.0, 1276.0, 720.0, 457.0, 305.0, 186.0, 149.0, 127.0, 77.0, 63.0, 54.0, 30.0, 23.0, 16.0, 11.0, 15.0, 12.0, 10.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-3.125, -3.03094482421875, -2.9368896484375, -2.84283447265625, -2.748779296875, -2.65472412109375, -2.5606689453125, -2.46661376953125, -2.37255859375, -2.27850341796875, -2.1844482421875, -2.09039306640625, -1.996337890625, -1.90228271484375, -1.8082275390625, -1.71417236328125, -1.6201171875, -1.52606201171875, -1.4320068359375, -1.33795166015625, -1.243896484375, -1.14984130859375, -1.0557861328125, -0.96173095703125, -0.86767578125, -0.77362060546875, -0.6795654296875, -0.58551025390625, -0.491455078125, -0.39739990234375, -0.3033447265625, -0.20928955078125, -0.115234375, -0.02117919921875, 0.0728759765625, 0.16693115234375, 0.260986328125, 0.35504150390625, 0.4490966796875, 0.54315185546875, 0.63720703125, 0.73126220703125, 0.8253173828125, 0.91937255859375, 1.013427734375, 1.10748291015625, 1.2015380859375, 1.29559326171875, 1.3896484375, 1.48370361328125, 1.5777587890625, 1.67181396484375, 1.765869140625, 1.85992431640625, 1.9539794921875, 2.04803466796875, 2.14208984375, 2.23614501953125, 2.3302001953125, 2.42425537109375, 2.518310546875, 2.61236572265625, 2.7064208984375, 2.80047607421875, 2.89453125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 6.0, 10.0, 12.0, 14.0, 7.0, 11.0, 13.0, 31.0, 25.0, 41.0, 31.0, 37.0, 47.0, 37.0, 30.0, 47.0, 42.0, 53.0, 41.0, 41.0, 31.0, 39.0, 32.0, 37.0, 37.0, 26.0, 41.0, 22.0, 22.0, 18.0, 19.0, 15.0, 11.0, 5.0, 11.0, 10.0, 7.0, 7.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-3.427734375, -3.32080078125, -3.2138671875, -3.10693359375, -3.0, -2.89306640625, -2.7861328125, -2.67919921875, -2.572265625, -2.46533203125, -2.3583984375, -2.25146484375, -2.14453125, -2.03759765625, -1.9306640625, -1.82373046875, -1.716796875, -1.60986328125, -1.5029296875, -1.39599609375, -1.2890625, -1.18212890625, -1.0751953125, -0.96826171875, -0.861328125, -0.75439453125, -0.6474609375, -0.54052734375, -0.43359375, -0.32666015625, -0.2197265625, -0.11279296875, -0.005859375, 0.10107421875, 0.2080078125, 0.31494140625, 0.421875, 0.52880859375, 0.6357421875, 0.74267578125, 0.849609375, 0.95654296875, 1.0634765625, 1.17041015625, 1.27734375, 1.38427734375, 1.4912109375, 1.59814453125, 1.705078125, 1.81201171875, 1.9189453125, 2.02587890625, 2.1328125, 2.23974609375, 2.3466796875, 2.45361328125, 2.560546875, 2.66748046875, 2.7744140625, 2.88134765625, 2.98828125, 3.09521484375, 3.2021484375, 3.30908203125, 3.416015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 9.0, 27.0, 42.0, 75.0, 222.0, 536.0, 2536.0, 41220.0, 941287.0, 58537.0, 3031.0, 645.0, 206.0, 80.0, 35.0, 19.0, 11.0, 5.0, 7.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.638671875, -1.58502197265625, -1.5313720703125, -1.47772216796875, -1.424072265625, -1.37042236328125, -1.3167724609375, -1.26312255859375, -1.20947265625, -1.15582275390625, -1.1021728515625, -1.04852294921875, -0.994873046875, -0.94122314453125, -0.8875732421875, -0.83392333984375, -0.7802734375, -0.72662353515625, -0.6729736328125, -0.61932373046875, -0.565673828125, -0.51202392578125, -0.4583740234375, -0.40472412109375, -0.35107421875, -0.29742431640625, -0.2437744140625, -0.19012451171875, -0.136474609375, -0.08282470703125, -0.0291748046875, 0.02447509765625, 0.078125, 0.13177490234375, 0.1854248046875, 0.23907470703125, 0.292724609375, 0.34637451171875, 0.4000244140625, 0.45367431640625, 0.50732421875, 0.56097412109375, 0.6146240234375, 0.66827392578125, 0.721923828125, 0.77557373046875, 0.8292236328125, 0.88287353515625, 0.9365234375, 0.99017333984375, 1.0438232421875, 1.09747314453125, 1.151123046875, 1.20477294921875, 1.2584228515625, 1.31207275390625, 1.36572265625, 1.41937255859375, 1.4730224609375, 1.52667236328125, 1.580322265625, 1.63397216796875, 1.6876220703125, 1.74127197265625, 1.794921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 25.0, 17.0, 27.0, 47.0, 47.0, 92.0, 130.0, 117.0, 134.0, 94.0, 68.0, 49.0, 37.0, 24.0, 23.0, 17.0, 12.0, 4.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003330707550048828, -0.00032491981983184814, -0.0003167688846588135, -0.0003086179494857788, -0.00030046701431274414, -0.00029231607913970947, -0.0002841651439666748, -0.00027601420879364014, -0.00026786327362060547, -0.0002597123384475708, -0.00025156140327453613, -0.00024341046810150146, -0.0002352595329284668, -0.00022710859775543213, -0.00021895766258239746, -0.0002108067274093628, -0.00020265579223632812, -0.00019450485706329346, -0.0001863539218902588, -0.00017820298671722412, -0.00017005205154418945, -0.00016190111637115479, -0.00015375018119812012, -0.00014559924602508545, -0.00013744831085205078, -0.0001292973756790161, -0.00012114644050598145, -0.00011299550533294678, -0.00010484457015991211, -9.669363498687744e-05, -8.854269981384277e-05, -8.03917646408081e-05, -7.224082946777344e-05, -6.408989429473877e-05, -5.59389591217041e-05, -4.7788023948669434e-05, -3.9637088775634766e-05, -3.14861536026001e-05, -2.333521842956543e-05, -1.5184283256530762e-05, -7.033348083496094e-06, 1.1175870895385742e-06, 9.268522262573242e-06, 1.741945743560791e-05, 2.5570392608642578e-05, 3.3721327781677246e-05, 4.1872262954711914e-05, 5.002319812774658e-05, 5.817413330078125e-05, 6.632506847381592e-05, 7.447600364685059e-05, 8.262693881988525e-05, 9.077787399291992e-05, 9.892880916595459e-05, 0.00010707974433898926, 0.00011523067951202393, 0.0001233816146850586, 0.00013153254985809326, 0.00013968348503112793, 0.0001478344202041626, 0.00015598535537719727, 0.00016413629055023193, 0.0001722872257232666, 0.00018043816089630127, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 9.0, 17.0, 17.0, 36.0, 53.0, 108.0, 217.0, 429.0, 977.0, 2664.0, 13423.0, 196161.0, 778581.0, 47242.0, 5775.0, 1572.0, 599.0, 297.0, 161.0, 85.0, 57.0, 20.0, 24.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2838287353515625, -1.250274658203125, -1.2167205810546875, -1.18316650390625, -1.1496124267578125, -1.116058349609375, -1.0825042724609375, -1.0489501953125, -1.0153961181640625, -0.981842041015625, -0.9482879638671875, -0.91473388671875, -0.8811798095703125, -0.847625732421875, -0.8140716552734375, -0.780517578125, -0.7469635009765625, -0.713409423828125, -0.6798553466796875, -0.64630126953125, -0.6127471923828125, -0.579193115234375, -0.5456390380859375, -0.5120849609375, -0.4785308837890625, -0.444976806640625, -0.4114227294921875, -0.37786865234375, -0.3443145751953125, -0.310760498046875, -0.2772064208984375, -0.24365234375, -0.2100982666015625, -0.176544189453125, -0.1429901123046875, -0.10943603515625, -0.0758819580078125, -0.042327880859375, -0.0087738037109375, 0.0247802734375, 0.0583343505859375, 0.091888427734375, 0.1254425048828125, 0.15899658203125, 0.1925506591796875, 0.226104736328125, 0.2596588134765625, 0.293212890625, 0.3267669677734375, 0.360321044921875, 0.3938751220703125, 0.42742919921875, 0.4609832763671875, 0.494537353515625, 0.5280914306640625, 0.5616455078125, 0.5951995849609375, 0.628753662109375, 0.6623077392578125, 0.69586181640625, 0.7294158935546875, 0.762969970703125, 0.7965240478515625, 0.830078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 4.0, 10.0, 9.0, 10.0, 17.0, 21.0, 31.0, 39.0, 34.0, 41.0, 55.0, 72.0, 66.0, 63.0, 75.0, 59.0, 59.0, 55.0, 46.0, 44.0, 35.0, 34.0, 18.0, 16.0, 15.0, 12.0, 8.0, 4.0, 10.0, 4.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6647186279296875, -0.643402099609375, -0.6220855712890625, -0.60076904296875, -0.5794525146484375, -0.558135986328125, -0.5368194580078125, -0.5155029296875, -0.4941864013671875, -0.472869873046875, -0.4515533447265625, -0.43023681640625, -0.4089202880859375, -0.387603759765625, -0.3662872314453125, -0.344970703125, -0.3236541748046875, -0.302337646484375, -0.2810211181640625, -0.25970458984375, -0.2383880615234375, -0.217071533203125, -0.1957550048828125, -0.1744384765625, -0.1531219482421875, -0.131805419921875, -0.1104888916015625, -0.08917236328125, -0.0678558349609375, -0.046539306640625, -0.0252227783203125, -0.00390625, 0.0174102783203125, 0.038726806640625, 0.0600433349609375, 0.08135986328125, 0.1026763916015625, 0.123992919921875, 0.1453094482421875, 0.1666259765625, 0.1879425048828125, 0.209259033203125, 0.2305755615234375, 0.25189208984375, 0.2732086181640625, 0.294525146484375, 0.3158416748046875, 0.337158203125, 0.3584747314453125, 0.379791259765625, 0.4011077880859375, 0.42242431640625, 0.4437408447265625, 0.465057373046875, 0.4863739013671875, 0.5076904296875, 0.5290069580078125, 0.550323486328125, 0.5716400146484375, 0.59295654296875, 0.6142730712890625, 0.635589599609375, 0.6569061279296875, 0.67822265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 11.0, 29.0, 33.0, 90.0, 154.0, 215.0, 213.0, 117.0, 55.0, 39.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.04113006591797, -19.432435989379883, -18.823741912841797, -18.215045928955078, -17.606351852416992, -16.997657775878906, -16.38896369934082, -15.780268669128418, -15.171573638916016, -14.56287956237793, -13.954184532165527, -13.345490455627441, -12.736795425415039, -12.128101348876953, -11.519407272338867, -10.910712242126465, -10.302018165588379, -9.693324089050293, -9.08462905883789, -8.475934982299805, -7.867239952087402, -7.258545875549316, -6.649851322174072, -6.041156768798828, -5.432462215423584, -4.82376766204834, -4.215073108673096, -3.6063787937164307, -2.9976842403411865, -2.3889896869659424, -1.7802953720092773, -1.1716008186340332, -0.5629062652587891, 0.0457882285118103, 0.6544827222824097, 1.2631771564483643, 1.8718717098236084, 2.4805662631988525, 3.0892605781555176, 3.6979551315307617, 4.306649684906006, 4.91534423828125, 5.524038791656494, 6.132733345031738, 6.741427421569824, 7.350122451782227, 7.9588165283203125, 8.567510604858398, 9.1762056350708, 9.784899711608887, 10.393594741821289, 11.002288818359375, 11.610983848571777, 12.219677925109863, 12.828372955322266, 13.437067031860352, 14.045761108398438, 14.654455184936523, 15.263150215148926, 15.871844291687012, 16.480539321899414, 17.0892333984375, 17.697927474975586, 18.306621551513672, 18.91531753540039]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 0.0, 4.0, 6.0, 8.0, 18.0, 11.0, 24.0, 21.0, 32.0, 42.0, 37.0, 33.0, 71.0, 60.0, 89.0, 116.0, 74.0, 64.0, 43.0, 50.0, 56.0, 32.0, 32.0, 23.0, 14.0, 11.0, 11.0, 8.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.731983184814453, -26.08621597290039, -25.440446853637695, -24.794679641723633, -24.14891242980957, -23.503145217895508, -22.857376098632812, -22.21160888671875, -21.565841674804688, -20.920074462890625, -20.27430534362793, -19.628538131713867, -18.982770919799805, -18.337003707885742, -17.691234588623047, -17.045467376708984, -16.399700164794922, -15.753931999206543, -15.10816478729248, -14.462396621704102, -13.816629409790039, -13.17086124420166, -12.525093078613281, -11.879325866699219, -11.233556747436523, -10.587788581848145, -9.942021369934082, -9.296253204345703, -8.65048599243164, -8.004717826843262, -7.358950138092041, -6.71318244934082, -6.067415237426758, -5.421647548675537, -4.775879859924316, -4.1301116943359375, -3.484344244003296, -2.838576555252075, -2.1928086280822754, -1.5470409393310547, -0.901273250579834, -0.2555055022239685, 0.390262246131897, 1.0360300540924072, 1.681797742843628, 2.3275654315948486, 2.9733333587646484, 3.619101047515869, 4.26486873626709, 4.9106364250183105, 5.556404113769531, 6.20217227935791, 6.847939491271973, 7.493707656860352, 8.139474868774414, 8.785243034362793, 9.431011199951172, 10.07677936553955, 10.722546577453613, 11.368314743041992, 12.014081954956055, 12.659850120544434, 13.305618286132812, 13.951385498046875, 14.597152709960938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 8.0, 12.0, 17.0, 13.0, 29.0, 57.0, 90.0, 141.0, 304.0, 548.0, 1106.0, 2600.0, 7023.0, 24979.0, 126243.0, 919856.0, 2500677.0, 503236.0, 77142.0, 18822.0, 6155.0, 2586.0, 1265.0, 633.0, 352.0, 174.0, 88.0, 42.0, 32.0, 8.0, 13.0, 9.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3505859375, -1.3171234130859375, -1.283660888671875, -1.2501983642578125, -1.21673583984375, -1.1832733154296875, -1.149810791015625, -1.1163482666015625, -1.0828857421875, -1.0494232177734375, -1.015960693359375, -0.9824981689453125, -0.94903564453125, -0.9155731201171875, -0.882110595703125, -0.8486480712890625, -0.815185546875, -0.7817230224609375, -0.748260498046875, -0.7147979736328125, -0.68133544921875, -0.6478729248046875, -0.614410400390625, -0.5809478759765625, -0.5474853515625, -0.5140228271484375, -0.480560302734375, -0.4470977783203125, -0.41363525390625, -0.3801727294921875, -0.346710205078125, -0.3132476806640625, -0.27978515625, -0.2463226318359375, -0.212860107421875, -0.1793975830078125, -0.14593505859375, -0.1124725341796875, -0.079010009765625, -0.0455474853515625, -0.0120849609375, 0.0213775634765625, 0.054840087890625, 0.0883026123046875, 0.12176513671875, 0.1552276611328125, 0.188690185546875, 0.2221527099609375, 0.255615234375, 0.2890777587890625, 0.322540283203125, 0.3560028076171875, 0.38946533203125, 0.4229278564453125, 0.456390380859375, 0.4898529052734375, 0.5233154296875, 0.5567779541015625, 0.590240478515625, 0.6237030029296875, 0.65716552734375, 0.6906280517578125, 0.724090576171875, 0.7575531005859375, 0.791015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 15.0, 24.0, 43.0, 51.0, 71.0, 88.0, 88.0, 106.0, 105.0, 99.0, 85.0, 53.0, 45.0, 36.0, 25.0, 19.0, 11.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4375, -2.3855438232421875, -2.333587646484375, -2.2816314697265625, -2.22967529296875, -2.1777191162109375, -2.125762939453125, -2.0738067626953125, -2.0218505859375, -1.9698944091796875, -1.917938232421875, -1.8659820556640625, -1.81402587890625, -1.7620697021484375, -1.710113525390625, -1.6581573486328125, -1.606201171875, -1.5542449951171875, -1.502288818359375, -1.4503326416015625, -1.39837646484375, -1.3464202880859375, -1.294464111328125, -1.2425079345703125, -1.1905517578125, -1.1385955810546875, -1.086639404296875, -1.0346832275390625, -0.98272705078125, -0.9307708740234375, -0.878814697265625, -0.8268585205078125, -0.77490234375, -0.7229461669921875, -0.670989990234375, -0.6190338134765625, -0.56707763671875, -0.5151214599609375, -0.463165283203125, -0.4112091064453125, -0.3592529296875, -0.3072967529296875, -0.255340576171875, -0.2033843994140625, -0.15142822265625, -0.0994720458984375, -0.047515869140625, 0.0044403076171875, 0.056396484375, 0.1083526611328125, 0.160308837890625, 0.2122650146484375, 0.26422119140625, 0.3161773681640625, 0.368133544921875, 0.4200897216796875, 0.4720458984375, 0.5240020751953125, 0.575958251953125, 0.6279144287109375, 0.67987060546875, 0.7318267822265625, 0.783782958984375, 0.8357391357421875, 0.8876953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 10.0, 12.0, 20.0, 31.0, 50.0, 84.0, 156.0, 248.0, 449.0, 1015.0, 2702.0, 7728.0, 29591.0, 186522.0, 2978607.0, 879457.0, 80889.0, 17803.0, 5165.0, 1895.0, 808.0, 421.0, 218.0, 150.0, 73.0, 53.0, 36.0, 24.0, 19.0, 13.0, 6.0, 5.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.71875, -1.6693115234375, -1.619873046875, -1.5704345703125, -1.52099609375, -1.4715576171875, -1.422119140625, -1.3726806640625, -1.3232421875, -1.2738037109375, -1.224365234375, -1.1749267578125, -1.12548828125, -1.0760498046875, -1.026611328125, -0.9771728515625, -0.927734375, -0.8782958984375, -0.828857421875, -0.7794189453125, -0.72998046875, -0.6805419921875, -0.631103515625, -0.5816650390625, -0.5322265625, -0.4827880859375, -0.433349609375, -0.3839111328125, -0.33447265625, -0.2850341796875, -0.235595703125, -0.1861572265625, -0.13671875, -0.0872802734375, -0.037841796875, 0.0115966796875, 0.06103515625, 0.1104736328125, 0.159912109375, 0.2093505859375, 0.2587890625, 0.3082275390625, 0.357666015625, 0.4071044921875, 0.45654296875, 0.5059814453125, 0.555419921875, 0.6048583984375, 0.654296875, 0.7037353515625, 0.753173828125, 0.8026123046875, 0.85205078125, 0.9014892578125, 0.950927734375, 1.0003662109375, 1.0498046875, 1.0992431640625, 1.148681640625, 1.1981201171875, 1.24755859375, 1.2969970703125, 1.346435546875, 1.3958740234375, 1.4453125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 15.0, 14.0, 17.0, 26.0, 24.0, 63.0, 101.0, 121.0, 265.0, 442.0, 686.0, 775.0, 589.0, 305.0, 191.0, 139.0, 74.0, 34.0, 38.0, 43.0, 31.0, 18.0, 10.0, 10.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.8517913818359375, -1.790496826171875, -1.7292022705078125, -1.66790771484375, -1.6066131591796875, -1.545318603515625, -1.4840240478515625, -1.4227294921875, -1.3614349365234375, -1.300140380859375, -1.2388458251953125, -1.17755126953125, -1.1162567138671875, -1.054962158203125, -0.9936676025390625, -0.932373046875, -0.8710784912109375, -0.809783935546875, -0.7484893798828125, -0.68719482421875, -0.6259002685546875, -0.564605712890625, -0.5033111572265625, -0.4420166015625, -0.3807220458984375, -0.319427490234375, -0.2581329345703125, -0.19683837890625, -0.1355438232421875, -0.074249267578125, -0.0129547119140625, 0.04833984375, 0.1096343994140625, 0.170928955078125, 0.2322235107421875, 0.29351806640625, 0.3548126220703125, 0.416107177734375, 0.4774017333984375, 0.5386962890625, 0.5999908447265625, 0.661285400390625, 0.7225799560546875, 0.78387451171875, 0.8451690673828125, 0.906463623046875, 0.9677581787109375, 1.029052734375, 1.0903472900390625, 1.151641845703125, 1.2129364013671875, 1.27423095703125, 1.3355255126953125, 1.396820068359375, 1.4581146240234375, 1.5194091796875, 1.5807037353515625, 1.641998291015625, 1.7032928466796875, 1.76458740234375, 1.8258819580078125, 1.887176513671875, 1.9484710693359375, 2.009765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 31.0, 217.0, 438.0, 233.0, 53.0, 10.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.59027099609375, -34.2432746887207, -32.896278381347656, -31.549283981323242, -30.202289581298828, -28.85529327392578, -27.508296966552734, -26.16130256652832, -24.814308166503906, -23.46731185913086, -22.120317459106445, -20.7733211517334, -19.426326751708984, -18.079330444335938, -16.73233413696289, -15.385339736938477, -14.03834342956543, -12.6913480758667, -11.344352722167969, -9.997356414794922, -8.650362014770508, -7.303366184234619, -5.9563703536987305, -4.609375, -3.2623796463012695, -1.9153841733932495, -0.5683887004852295, 0.7786068916320801, 2.1256022453308105, 3.472597599029541, 4.81959342956543, 6.16658878326416, 7.513584136962891, 8.860579490661621, 10.207574844360352, 11.554571151733398, 12.901565551757812, 14.24856185913086, 15.59555721282959, 16.94255256652832, 18.289546966552734, 19.63654327392578, 20.983537673950195, 22.330533981323242, 23.677528381347656, 25.024524688720703, 26.37152099609375, 27.718515396118164, 29.06551170349121, 30.412508010864258, 31.759502410888672, 33.10649871826172, 34.453495025634766, 35.80048751831055, 37.147483825683594, 38.49448013305664, 39.84147644042969, 41.188472747802734, 42.53546905517578, 43.88246154785156, 45.22945785522461, 46.576454162597656, 47.9234504699707, 49.27044677734375, 50.61743927001953]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 11.0, 4.0, 6.0, 9.0, 13.0, 12.0, 24.0, 30.0, 37.0, 46.0, 53.0, 68.0, 45.0, 62.0, 78.0, 44.0, 65.0, 64.0, 53.0, 38.0, 49.0, 37.0, 36.0, 22.0, 25.0, 27.0, 10.0, 14.0, 8.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546370506286621, -11.097363471984863, -10.648356437683105, -10.199349403381348, -9.750341415405273, -9.301334381103516, -8.852327346801758, -8.4033203125, -7.954313278198242, -7.505306243896484, -7.056299209594727, -6.6072916984558105, -6.158284664154053, -5.709277629852295, -5.260270118713379, -4.811263084411621, -4.362256050109863, -3.9132490158081055, -3.4642417430877686, -3.0152344703674316, -2.566227436065674, -2.117220401763916, -1.668213129043579, -1.2192058563232422, -0.7701988220214844, -0.321191668510437, 0.12781548500061035, 0.5768226385116577, 1.025829792022705, 1.474836826324463, 1.9238440990447998, 2.3728513717651367, 2.821859359741211, 3.2708663940429688, 3.7198736667633057, 4.168880939483643, 4.6178879737854, 5.066895008087158, 5.515902519226074, 5.964909553527832, 6.41391658782959, 6.862923622131348, 7.3119306564331055, 7.7609381675720215, 8.209945678710938, 8.658952713012695, 9.107959747314453, 9.556966781616211, 10.005973815917969, 10.454980850219727, 10.903987884521484, 11.352994918823242, 11.802001953125, 12.251008987426758, 12.700016975402832, 13.14902400970459, 13.598031044006348, 14.047038078308105, 14.496045112609863, 14.945052146911621, 15.394060134887695, 15.843067169189453, 16.29207420349121, 16.74108123779297, 17.190088272094727]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 12.0, 21.0, 29.0, 35.0, 68.0, 127.0, 203.0, 416.0, 675.0, 1341.0, 2549.0, 5086.0, 10830.0, 24784.0, 56589.0, 131326.0, 269742.0, 285153.0, 145975.0, 63145.0, 26937.0, 12056.0, 5513.0, 2769.0, 1354.0, 811.0, 437.0, 221.0, 142.0, 74.0, 49.0, 40.0, 10.0, 7.0, 9.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0368804931640625, -0.998565673828125, -0.9602508544921875, -0.92193603515625, -0.8836212158203125, -0.845306396484375, -0.8069915771484375, -0.7686767578125, -0.7303619384765625, -0.692047119140625, -0.6537322998046875, -0.61541748046875, -0.5771026611328125, -0.538787841796875, -0.5004730224609375, -0.462158203125, -0.4238433837890625, -0.385528564453125, -0.3472137451171875, -0.30889892578125, -0.2705841064453125, -0.232269287109375, -0.1939544677734375, -0.1556396484375, -0.1173248291015625, -0.079010009765625, -0.0406951904296875, -0.00238037109375, 0.0359344482421875, 0.074249267578125, 0.1125640869140625, 0.15087890625, 0.1891937255859375, 0.227508544921875, 0.2658233642578125, 0.30413818359375, 0.3424530029296875, 0.380767822265625, 0.4190826416015625, 0.4573974609375, 0.4957122802734375, 0.534027099609375, 0.5723419189453125, 0.61065673828125, 0.6489715576171875, 0.687286376953125, 0.7256011962890625, 0.763916015625, 0.8022308349609375, 0.840545654296875, 0.8788604736328125, 0.91717529296875, 0.9554901123046875, 0.993804931640625, 1.0321197509765625, 1.0704345703125, 1.1087493896484375, 1.147064208984375, 1.1853790283203125, 1.22369384765625, 1.2620086669921875, 1.300323486328125, 1.3386383056640625, 1.376953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 4.0, 10.0, 14.0, 14.0, 18.0, 22.0, 27.0, 36.0, 43.0, 53.0, 46.0, 60.0, 56.0, 70.0, 45.0, 56.0, 55.0, 50.0, 60.0, 38.0, 41.0, 22.0, 33.0, 29.0, 19.0, 18.0, 7.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0458984375, -1.0156402587890625, -0.985382080078125, -0.9551239013671875, -0.92486572265625, -0.8946075439453125, -0.864349365234375, -0.8340911865234375, -0.8038330078125, -0.7735748291015625, -0.743316650390625, -0.7130584716796875, -0.68280029296875, -0.6525421142578125, -0.622283935546875, -0.5920257568359375, -0.561767578125, -0.5315093994140625, -0.501251220703125, -0.4709930419921875, -0.44073486328125, -0.4104766845703125, -0.380218505859375, -0.3499603271484375, -0.3197021484375, -0.2894439697265625, -0.259185791015625, -0.2289276123046875, -0.19866943359375, -0.1684112548828125, -0.138153076171875, -0.1078948974609375, -0.07763671875, -0.0473785400390625, -0.017120361328125, 0.0131378173828125, 0.04339599609375, 0.0736541748046875, 0.103912353515625, 0.1341705322265625, 0.1644287109375, 0.1946868896484375, 0.224945068359375, 0.2552032470703125, 0.28546142578125, 0.3157196044921875, 0.345977783203125, 0.3762359619140625, 0.406494140625, 0.4367523193359375, 0.467010498046875, 0.4972686767578125, 0.52752685546875, 0.5577850341796875, 0.588043212890625, 0.6183013916015625, 0.6485595703125, 0.6788177490234375, 0.709075927734375, 0.7393341064453125, 0.76959228515625, 0.7998504638671875, 0.830108642578125, 0.8603668212890625, 0.890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 12.0, 16.0, 22.0, 35.0, 34.0, 60.0, 70.0, 105.0, 157.0, 208.0, 330.0, 503.0, 932.0, 1827.0, 4932.0, 21657.0, 181740.0, 717725.0, 97391.0, 13417.0, 3601.0, 1528.0, 786.0, 457.0, 301.0, 196.0, 137.0, 105.0, 65.0, 44.0, 35.0, 34.0, 29.0, 9.0, 12.0, 6.0, 10.0, 5.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5, -2.40863037109375, -2.3172607421875, -2.22589111328125, -2.134521484375, -2.04315185546875, -1.9517822265625, -1.86041259765625, -1.76904296875, -1.67767333984375, -1.5863037109375, -1.49493408203125, -1.403564453125, -1.31219482421875, -1.2208251953125, -1.12945556640625, -1.0380859375, -0.94671630859375, -0.8553466796875, -0.76397705078125, -0.672607421875, -0.58123779296875, -0.4898681640625, -0.39849853515625, -0.30712890625, -0.21575927734375, -0.1243896484375, -0.03302001953125, 0.058349609375, 0.14971923828125, 0.2410888671875, 0.33245849609375, 0.423828125, 0.51519775390625, 0.6065673828125, 0.69793701171875, 0.789306640625, 0.88067626953125, 0.9720458984375, 1.06341552734375, 1.15478515625, 1.24615478515625, 1.3375244140625, 1.42889404296875, 1.520263671875, 1.61163330078125, 1.7030029296875, 1.79437255859375, 1.8857421875, 1.97711181640625, 2.0684814453125, 2.15985107421875, 2.251220703125, 2.34259033203125, 2.4339599609375, 2.52532958984375, 2.61669921875, 2.70806884765625, 2.7994384765625, 2.89080810546875, 2.982177734375, 3.07354736328125, 3.1649169921875, 3.25628662109375, 3.34765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 4.0, 15.0, 18.0, 17.0, 24.0, 14.0, 21.0, 35.0, 24.0, 33.0, 37.0, 44.0, 38.0, 49.0, 55.0, 59.0, 41.0, 55.0, 54.0, 44.0, 43.0, 41.0, 35.0, 34.0, 31.0, 16.0, 19.0, 21.0, 16.0, 8.0, 8.0, 10.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.828399658203125, -2.72711181640625, -2.625823974609375, -2.5245361328125, -2.423248291015625, -2.32196044921875, -2.220672607421875, -2.119384765625, -2.018096923828125, -1.91680908203125, -1.815521240234375, -1.7142333984375, -1.612945556640625, -1.51165771484375, -1.410369873046875, -1.30908203125, -1.207794189453125, -1.10650634765625, -1.005218505859375, -0.9039306640625, -0.802642822265625, -0.70135498046875, -0.600067138671875, -0.498779296875, -0.397491455078125, -0.29620361328125, -0.194915771484375, -0.0936279296875, 0.007659912109375, 0.10894775390625, 0.210235595703125, 0.3115234375, 0.412811279296875, 0.51409912109375, 0.615386962890625, 0.7166748046875, 0.817962646484375, 0.91925048828125, 1.020538330078125, 1.121826171875, 1.223114013671875, 1.32440185546875, 1.425689697265625, 1.5269775390625, 1.628265380859375, 1.72955322265625, 1.830841064453125, 1.93212890625, 2.033416748046875, 2.13470458984375, 2.235992431640625, 2.3372802734375, 2.438568115234375, 2.53985595703125, 2.641143798828125, 2.742431640625, 2.843719482421875, 2.94500732421875, 3.046295166015625, 3.1475830078125, 3.248870849609375, 3.35015869140625, 3.451446533203125, 3.552734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 5.0, 7.0, 6.0, 16.0, 17.0, 32.0, 36.0, 84.0, 135.0, 308.0, 809.0, 2632.0, 13474.0, 122817.0, 780671.0, 110924.0, 12663.0, 2516.0, 748.0, 330.0, 127.0, 84.0, 40.0, 19.0, 21.0, 18.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0185546875, -0.989013671875, -0.95947265625, -0.929931640625, -0.900390625, -0.870849609375, -0.84130859375, -0.811767578125, -0.7822265625, -0.752685546875, -0.72314453125, -0.693603515625, -0.6640625, -0.634521484375, -0.60498046875, -0.575439453125, -0.5458984375, -0.516357421875, -0.48681640625, -0.457275390625, -0.427734375, -0.398193359375, -0.36865234375, -0.339111328125, -0.3095703125, -0.280029296875, -0.25048828125, -0.220947265625, -0.19140625, -0.161865234375, -0.13232421875, -0.102783203125, -0.0732421875, -0.043701171875, -0.01416015625, 0.015380859375, 0.044921875, 0.074462890625, 0.10400390625, 0.133544921875, 0.1630859375, 0.192626953125, 0.22216796875, 0.251708984375, 0.28125, 0.310791015625, 0.34033203125, 0.369873046875, 0.3994140625, 0.428955078125, 0.45849609375, 0.488037109375, 0.517578125, 0.547119140625, 0.57666015625, 0.606201171875, 0.6357421875, 0.665283203125, 0.69482421875, 0.724365234375, 0.75390625, 0.783447265625, 0.81298828125, 0.842529296875, 0.8720703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 10.0, 9.0, 11.0, 8.0, 19.0, 31.0, 32.0, 35.0, 69.0, 98.0, 117.0, 120.0, 114.0, 86.0, 87.0, 44.0, 29.0, 25.0, 13.0, 12.0, 9.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021505355834960938, -0.0002069510519504547, -0.00019884854555130005, -0.00019074603915214539, -0.00018264353275299072, -0.00017454102635383606, -0.0001664385199546814, -0.00015833601355552673, -0.00015023350715637207, -0.0001421310007572174, -0.00013402849435806274, -0.00012592598795890808, -0.00011782348155975342, -0.00010972097516059875, -0.00010161846876144409, -9.351596236228943e-05, -8.541345596313477e-05, -7.73109495639801e-05, -6.920844316482544e-05, -6.110593676567078e-05, -5.300343036651611e-05, -4.490092396736145e-05, -3.679841756820679e-05, -2.8695911169052124e-05, -2.059340476989746e-05, -1.2490898370742798e-05, -4.388391971588135e-06, 3.7141144275665283e-06, 1.1816620826721191e-05, 1.9919127225875854e-05, 2.8021633625030518e-05, 3.612414002418518e-05, 4.4226646423339844e-05, 5.232915282249451e-05, 6.043165922164917e-05, 6.853416562080383e-05, 7.66366720199585e-05, 8.473917841911316e-05, 9.284168481826782e-05, 0.00010094419121742249, 0.00010904669761657715, 0.00011714920401573181, 0.00012525171041488647, 0.00013335421681404114, 0.0001414567232131958, 0.00014955922961235046, 0.00015766173601150513, 0.0001657642424106598, 0.00017386674880981445, 0.00018196925520896912, 0.00019007176160812378, 0.00019817426800727844, 0.0002062767744064331, 0.00021437928080558777, 0.00022248178720474243, 0.0002305842936038971, 0.00023868680000305176, 0.0002467893064022064, 0.0002548918128013611, 0.00026299431920051575, 0.0002710968255996704, 0.0002791993319988251, 0.00028730183839797974, 0.0002954043447971344, 0.00030350685119628906]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 8.0, 10.0, 14.0, 20.0, 23.0, 48.0, 81.0, 162.0, 325.0, 645.0, 1574.0, 5123.0, 28776.0, 324271.0, 632019.0, 45118.0, 6863.0, 1929.0, 775.0, 356.0, 193.0, 81.0, 62.0, 33.0, 15.0, 12.0, 11.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73046875, -0.7035140991210938, -0.6765594482421875, -0.6496047973632812, -0.622650146484375, -0.5956954956054688, -0.5687408447265625, -0.5417861938476562, -0.51483154296875, -0.48787689208984375, -0.4609222412109375, -0.43396759033203125, -0.407012939453125, -0.38005828857421875, -0.3531036376953125, -0.32614898681640625, -0.2991943359375, -0.27223968505859375, -0.2452850341796875, -0.21833038330078125, -0.191375732421875, -0.16442108154296875, -0.1374664306640625, -0.11051177978515625, -0.08355712890625, -0.05660247802734375, -0.0296478271484375, -0.00269317626953125, 0.024261474609375, 0.05121612548828125, 0.0781707763671875, 0.10512542724609375, 0.132080078125, 0.15903472900390625, 0.1859893798828125, 0.21294403076171875, 0.239898681640625, 0.26685333251953125, 0.2938079833984375, 0.32076263427734375, 0.34771728515625, 0.37467193603515625, 0.4016265869140625, 0.42858123779296875, 0.455535888671875, 0.48249053955078125, 0.5094451904296875, 0.5363998413085938, 0.5633544921875, 0.5903091430664062, 0.6172637939453125, 0.6442184448242188, 0.671173095703125, 0.6981277465820312, 0.7250823974609375, 0.7520370483398438, 0.77899169921875, 0.8059463500976562, 0.8329010009765625, 0.8598556518554688, 0.886810302734375, 0.9137649536132812, 0.9407196044921875, 0.9676742553710938, 0.99462890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 9.0, 21.0, 30.0, 34.0, 37.0, 52.0, 56.0, 80.0, 91.0, 87.0, 91.0, 93.0, 77.0, 56.0, 57.0, 43.0, 18.0, 17.0, 11.0, 9.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43408203125, -0.40940093994140625, -0.3847198486328125, -0.36003875732421875, -0.335357666015625, -0.31067657470703125, -0.2859954833984375, -0.26131439208984375, -0.23663330078125, -0.21195220947265625, -0.1872711181640625, -0.16259002685546875, -0.137908935546875, -0.11322784423828125, -0.0885467529296875, -0.06386566162109375, -0.0391845703125, -0.01450347900390625, 0.0101776123046875, 0.03485870361328125, 0.059539794921875, 0.08422088623046875, 0.1089019775390625, 0.13358306884765625, 0.15826416015625, 0.18294525146484375, 0.2076263427734375, 0.23230743408203125, 0.256988525390625, 0.28166961669921875, 0.3063507080078125, 0.33103179931640625, 0.355712890625, 0.38039398193359375, 0.4050750732421875, 0.42975616455078125, 0.454437255859375, 0.47911834716796875, 0.5037994384765625, 0.5284805297851562, 0.55316162109375, 0.5778427124023438, 0.6025238037109375, 0.6272048950195312, 0.651885986328125, 0.6765670776367188, 0.7012481689453125, 0.7259292602539062, 0.7506103515625, 0.7752914428710938, 0.7999725341796875, 0.8246536254882812, 0.849334716796875, 0.8740158081054688, 0.8986968994140625, 0.9233779907226562, 0.94805908203125, 0.9727401733398438, 0.9974212646484375, 1.0221023559570312, 1.046783447265625, 1.0714645385742188, 1.0961456298828125, 1.1208267211914062, 1.1455078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 13.0, 21.0, 43.0, 82.0, 117.0, 259.0, 204.0, 113.0, 63.0, 33.0, 13.0, 15.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.277312278747559, -12.66807746887207, -12.058841705322266, -11.449606895446777, -10.840372085571289, -10.231136322021484, -9.621901512145996, -9.012666702270508, -8.403430938720703, -7.794195652008057, -7.18496036529541, -6.575725555419922, -5.966490268707275, -5.357254981994629, -4.748020172119141, -4.138784885406494, -3.5295495986938477, -2.920314311981201, -2.311079263687134, -1.7018440961837769, -1.09260892868042, -0.48337364196777344, 0.12586140632629395, 0.7350964546203613, 1.3443317413330078, 1.9535669088363647, 2.5628020763397217, 3.172037124633789, 3.7812724113464355, 4.390507698059082, 4.99974250793457, 5.608977794647217, 6.21821403503418, 6.827449321746826, 7.436684608459473, 8.045919418334961, 8.655155181884766, 9.264389991760254, 9.873624801635742, 10.482860565185547, 11.092095375061035, 11.701330184936523, 12.310565948486328, 12.919800758361816, 13.529035568237305, 14.13827133178711, 14.747506141662598, 15.356740951538086, 15.96597671508789, 16.575212478637695, 17.184446334838867, 17.793682098388672, 18.402917861938477, 19.01215362548828, 19.621387481689453, 20.230623245239258, 20.839859008789062, 21.449094772338867, 22.05832862854004, 22.667564392089844, 23.27680015563965, 23.886035919189453, 24.495269775390625, 25.10450553894043, 25.7137393951416]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 9.0, 12.0, 18.0, 10.0, 10.0, 13.0, 22.0, 26.0, 29.0, 41.0, 34.0, 29.0, 34.0, 71.0, 79.0, 85.0, 70.0, 55.0, 44.0, 37.0, 36.0, 33.0, 28.0, 26.0, 13.0, 22.0, 17.0, 9.0, 11.0, 11.0, 5.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.883549690246582, -13.452656745910645, -13.02176284790039, -12.590869903564453, -12.159976959228516, -11.729084014892578, -11.29819107055664, -10.867297172546387, -10.43640422821045, -10.005511283874512, -9.574617385864258, -9.14372444152832, -8.712831497192383, -8.281938552856445, -7.85104513168335, -7.420151710510254, -6.989258766174316, -6.558365821838379, -6.127472400665283, -5.6965789794921875, -5.26568603515625, -4.8347930908203125, -4.403899669647217, -3.9730064868927, -3.5421133041381836, -3.111220121383667, -2.6803269386291504, -2.249433755874634, -1.8185405731201172, -1.3876473903656006, -0.956754207611084, -0.5258610248565674, -0.09496688842773438, 0.3359262943267822, 0.7668194770812988, 1.1977126598358154, 1.628605842590332, 2.0594990253448486, 2.4903922080993652, 2.921285390853882, 3.3521785736083984, 3.783071756362915, 4.213964939117432, 4.644858360290527, 5.075751304626465, 5.506644248962402, 5.937537670135498, 6.368431091308594, 6.799324035644531, 7.230216979980469, 7.6611104011535645, 8.09200382232666, 8.522896766662598, 8.953789710998535, 9.384683609008789, 9.815576553344727, 10.246469497680664, 10.677362442016602, 11.108255386352539, 11.539149284362793, 11.97004222869873, 12.400935173034668, 12.831829071044922, 13.26272201538086, 13.693614959716797]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 14.0, 13.0, 19.0, 43.0, 58.0, 95.0, 187.0, 385.0, 889.0, 2632.0, 9492.0, 55217.0, 630481.0, 2895416.0, 534025.0, 51102.0, 9878.0, 2646.0, 893.0, 378.0, 179.0, 81.0, 50.0, 39.0, 21.0, 18.0, 9.0, 6.0, 1.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4296875, -1.3904876708984375, -1.351287841796875, -1.3120880126953125, -1.27288818359375, -1.2336883544921875, -1.194488525390625, -1.1552886962890625, -1.1160888671875, -1.0768890380859375, -1.037689208984375, -0.9984893798828125, -0.95928955078125, -0.9200897216796875, -0.880889892578125, -0.8416900634765625, -0.802490234375, -0.7632904052734375, -0.724090576171875, -0.6848907470703125, -0.64569091796875, -0.6064910888671875, -0.567291259765625, -0.5280914306640625, -0.4888916015625, -0.4496917724609375, -0.410491943359375, -0.3712921142578125, -0.33209228515625, -0.2928924560546875, -0.253692626953125, -0.2144927978515625, -0.17529296875, -0.1360931396484375, -0.096893310546875, -0.0576934814453125, -0.01849365234375, 0.0207061767578125, 0.059906005859375, 0.0991058349609375, 0.1383056640625, 0.1775054931640625, 0.216705322265625, 0.2559051513671875, 0.29510498046875, 0.3343048095703125, 0.373504638671875, 0.4127044677734375, 0.451904296875, 0.4911041259765625, 0.530303955078125, 0.5695037841796875, 0.60870361328125, 0.6479034423828125, 0.687103271484375, 0.7263031005859375, 0.7655029296875, 0.8047027587890625, 0.843902587890625, 0.8831024169921875, 0.92230224609375, 0.9615020751953125, 1.000701904296875, 1.0399017333984375, 1.0791015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 20.0, 15.0, 30.0, 31.0, 36.0, 43.0, 44.0, 66.0, 51.0, 71.0, 58.0, 55.0, 52.0, 61.0, 46.0, 40.0, 38.0, 42.0, 41.0, 24.0, 33.0, 13.0, 14.0, 12.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.06640625, -1.0360107421875, -1.005615234375, -0.9752197265625, -0.94482421875, -0.9144287109375, -0.884033203125, -0.8536376953125, -0.8232421875, -0.7928466796875, -0.762451171875, -0.7320556640625, -0.70166015625, -0.6712646484375, -0.640869140625, -0.6104736328125, -0.580078125, -0.5496826171875, -0.519287109375, -0.4888916015625, -0.45849609375, -0.4281005859375, -0.397705078125, -0.3673095703125, -0.3369140625, -0.3065185546875, -0.276123046875, -0.2457275390625, -0.21533203125, -0.1849365234375, -0.154541015625, -0.1241455078125, -0.09375, -0.0633544921875, -0.032958984375, -0.0025634765625, 0.02783203125, 0.0582275390625, 0.088623046875, 0.1190185546875, 0.1494140625, 0.1798095703125, 0.210205078125, 0.2406005859375, 0.27099609375, 0.3013916015625, 0.331787109375, 0.3621826171875, 0.392578125, 0.4229736328125, 0.453369140625, 0.4837646484375, 0.51416015625, 0.5445556640625, 0.574951171875, 0.6053466796875, 0.6357421875, 0.6661376953125, 0.696533203125, 0.7269287109375, 0.75732421875, 0.7877197265625, 0.818115234375, 0.8485107421875, 0.87890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 3.0, 12.0, 15.0, 29.0, 37.0, 47.0, 102.0, 165.0, 246.0, 542.0, 1134.0, 2808.0, 9240.0, 43062.0, 521962.0, 3370967.0, 208960.0, 25516.0, 5862.0, 1859.0, 808.0, 377.0, 202.0, 112.0, 63.0, 41.0, 29.0, 16.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.6003265380859375, -1.549285888671875, -1.4982452392578125, -1.44720458984375, -1.3961639404296875, -1.345123291015625, -1.2940826416015625, -1.2430419921875, -1.1920013427734375, -1.140960693359375, -1.0899200439453125, -1.03887939453125, -0.9878387451171875, -0.936798095703125, -0.8857574462890625, -0.834716796875, -0.7836761474609375, -0.732635498046875, -0.6815948486328125, -0.63055419921875, -0.5795135498046875, -0.528472900390625, -0.4774322509765625, -0.4263916015625, -0.3753509521484375, -0.324310302734375, -0.2732696533203125, -0.22222900390625, -0.1711883544921875, -0.120147705078125, -0.0691070556640625, -0.01806640625, 0.0329742431640625, 0.084014892578125, 0.1350555419921875, 0.18609619140625, 0.2371368408203125, 0.288177490234375, 0.3392181396484375, 0.3902587890625, 0.4412994384765625, 0.492340087890625, 0.5433807373046875, 0.59442138671875, 0.6454620361328125, 0.696502685546875, 0.7475433349609375, 0.798583984375, 0.8496246337890625, 0.900665283203125, 0.9517059326171875, 1.00274658203125, 1.0537872314453125, 1.104827880859375, 1.1558685302734375, 1.2069091796875, 1.2579498291015625, 1.308990478515625, 1.3600311279296875, 1.41107177734375, 1.4621124267578125, 1.513153076171875, 1.5641937255859375, 1.615234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 1.0, 5.0, 8.0, 10.0, 9.0, 14.0, 10.0, 23.0, 24.0, 29.0, 46.0, 64.0, 117.0, 198.0, 271.0, 442.0, 570.0, 631.0, 502.0, 385.0, 247.0, 155.0, 90.0, 54.0, 44.0, 34.0, 17.0, 14.0, 14.0, 9.0, 6.0, 9.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.2996063232421875, -1.253509521484375, -1.2074127197265625, -1.16131591796875, -1.1152191162109375, -1.069122314453125, -1.0230255126953125, -0.9769287109375, -0.9308319091796875, -0.884735107421875, -0.8386383056640625, -0.79254150390625, -0.7464447021484375, -0.700347900390625, -0.6542510986328125, -0.608154296875, -0.5620574951171875, -0.515960693359375, -0.4698638916015625, -0.42376708984375, -0.3776702880859375, -0.331573486328125, -0.2854766845703125, -0.2393798828125, -0.1932830810546875, -0.147186279296875, -0.1010894775390625, -0.05499267578125, -0.0088958740234375, 0.037200927734375, 0.0832977294921875, 0.12939453125, 0.1754913330078125, 0.221588134765625, 0.2676849365234375, 0.31378173828125, 0.3598785400390625, 0.405975341796875, 0.4520721435546875, 0.4981689453125, 0.5442657470703125, 0.590362548828125, 0.6364593505859375, 0.68255615234375, 0.7286529541015625, 0.774749755859375, 0.8208465576171875, 0.866943359375, 0.9130401611328125, 0.959136962890625, 1.0052337646484375, 1.05133056640625, 1.0974273681640625, 1.143524169921875, 1.1896209716796875, 1.2357177734375, 1.2818145751953125, 1.327911376953125, 1.3740081787109375, 1.42010498046875, 1.4662017822265625, 1.512298583984375, 1.5583953857421875, 1.6044921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 23.0, 61.0, 427.0, 396.0, 64.0, 16.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.95310592651367, -48.634666442871094, -47.31623077392578, -45.9977912902832, -44.679351806640625, -43.36091613769531, -42.042476654052734, -40.724037170410156, -39.405601501464844, -38.087162017822266, -36.76872634887695, -35.450286865234375, -34.13185119628906, -32.813411712646484, -31.494972229003906, -30.17653465270996, -28.858097076416016, -27.53965950012207, -26.221221923828125, -24.902782440185547, -23.5843448638916, -22.265907287597656, -20.947467803955078, -19.629030227661133, -18.310592651367188, -16.992155075073242, -15.67371654510498, -14.355278015136719, -13.036840438842773, -11.718402862548828, -10.399964332580566, -9.081525802612305, -7.763092041015625, -6.4446539878845215, -5.126215934753418, -3.8077778816223145, -2.489339828491211, -1.1709017753601074, 0.1475362777709961, 1.4659748077392578, 2.784412384033203, 4.102850437164307, 5.42128849029541, 6.739726543426514, 8.058164596557617, 9.376602172851562, 10.695040702819824, 12.013479232788086, 13.331916809082031, 14.650354385375977, 15.968792915344238, 17.2872314453125, 18.605669021606445, 19.92410659790039, 21.24254608154297, 22.560983657836914, 23.87942123413086, 25.197858810424805, 26.51629638671875, 27.834735870361328, 29.153173446655273, 30.47161102294922, 31.790050506591797, 33.108489990234375, 34.42692565917969]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 14.0, 13.0, 9.0, 16.0, 27.0, 17.0, 18.0, 36.0, 28.0, 44.0, 52.0, 58.0, 48.0, 59.0, 60.0, 60.0, 44.0, 57.0, 36.0, 53.0, 31.0, 35.0, 32.0, 32.0, 22.0, 23.0, 16.0, 13.0, 10.0, 10.0, 3.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.923690795898438, -10.651545524597168, -10.379400253295898, -10.107254981994629, -9.83510971069336, -9.56296443939209, -9.29081916809082, -9.018672943115234, -8.746528625488281, -8.474383354187012, -8.202238082885742, -7.930092811584473, -7.657947540283203, -7.385802268981934, -7.113656520843506, -6.841511249542236, -6.569365501403809, -6.297220230102539, -6.0250749588012695, -5.7529296875, -5.4807844161987305, -5.208639144897461, -4.936493396759033, -4.664348125457764, -4.392202854156494, -4.120057582855225, -3.847912311553955, -3.5757668018341064, -3.303621530532837, -3.0314762592315674, -2.7593307495117188, -2.487185478210449, -2.215041160583496, -1.9428958892822266, -1.6707504987716675, -1.3986051082611084, -1.1264598369598389, -0.8543145656585693, -0.5821691751480103, -0.31002378463745117, -0.03787851333618164, 0.23426681756973267, 0.506412148475647, 0.7785574793815613, 1.0507028102874756, 1.3228480815887451, 1.5949934720993042, 1.8671388626098633, 2.139284133911133, 2.4114294052124023, 2.683574676513672, 2.9557201862335205, 3.22786545753479, 3.5000107288360596, 3.772156238555908, 4.044301509857178, 4.316446781158447, 4.588592052459717, 4.860737323760986, 5.132882595062256, 5.405028343200684, 5.677173614501953, 5.949318885803223, 6.221464157104492, 6.493609428405762]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 5.0, 9.0, 7.0, 26.0, 28.0, 49.0, 96.0, 124.0, 209.0, 370.0, 533.0, 935.0, 1696.0, 2816.0, 5194.0, 9801.0, 19132.0, 38872.0, 79475.0, 155023.0, 235557.0, 224028.0, 136496.0, 68695.0, 33501.0, 16688.0, 8562.0, 4529.0, 2497.0, 1395.0, 868.0, 512.0, 299.0, 184.0, 130.0, 82.0, 45.0, 27.0, 23.0, 13.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8707427978515625, -0.842559814453125, -0.8143768310546875, -0.78619384765625, -0.7580108642578125, -0.729827880859375, -0.7016448974609375, -0.6734619140625, -0.6452789306640625, -0.617095947265625, -0.5889129638671875, -0.56072998046875, -0.5325469970703125, -0.504364013671875, -0.4761810302734375, -0.447998046875, -0.4198150634765625, -0.391632080078125, -0.3634490966796875, -0.33526611328125, -0.3070831298828125, -0.278900146484375, -0.2507171630859375, -0.2225341796875, -0.1943511962890625, -0.166168212890625, -0.1379852294921875, -0.10980224609375, -0.0816192626953125, -0.053436279296875, -0.0252532958984375, 0.0029296875, 0.0311126708984375, 0.059295654296875, 0.0874786376953125, 0.11566162109375, 0.1438446044921875, 0.172027587890625, 0.2002105712890625, 0.2283935546875, 0.2565765380859375, 0.284759521484375, 0.3129425048828125, 0.34112548828125, 0.3693084716796875, 0.397491455078125, 0.4256744384765625, 0.453857421875, 0.4820404052734375, 0.510223388671875, 0.5384063720703125, 0.56658935546875, 0.5947723388671875, 0.622955322265625, 0.6511383056640625, 0.6793212890625, 0.7075042724609375, 0.735687255859375, 0.7638702392578125, 0.79205322265625, 0.8202362060546875, 0.848419189453125, 0.8766021728515625, 0.90478515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 11.0, 4.0, 10.0, 11.0, 20.0, 23.0, 29.0, 25.0, 36.0, 35.0, 39.0, 63.0, 51.0, 50.0, 62.0, 59.0, 61.0, 55.0, 39.0, 39.0, 49.0, 37.0, 24.0, 28.0, 34.0, 13.0, 20.0, 21.0, 14.0, 9.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.013671875, -0.984344482421875, -0.95501708984375, -0.925689697265625, -0.8963623046875, -0.867034912109375, -0.83770751953125, -0.808380126953125, -0.779052734375, -0.749725341796875, -0.72039794921875, -0.691070556640625, -0.6617431640625, -0.632415771484375, -0.60308837890625, -0.573760986328125, -0.54443359375, -0.515106201171875, -0.48577880859375, -0.456451416015625, -0.4271240234375, -0.397796630859375, -0.36846923828125, -0.339141845703125, -0.309814453125, -0.280487060546875, -0.25115966796875, -0.221832275390625, -0.1925048828125, -0.163177490234375, -0.13385009765625, -0.104522705078125, -0.0751953125, -0.045867919921875, -0.01654052734375, 0.012786865234375, 0.0421142578125, 0.071441650390625, 0.10076904296875, 0.130096435546875, 0.159423828125, 0.188751220703125, 0.21807861328125, 0.247406005859375, 0.2767333984375, 0.306060791015625, 0.33538818359375, 0.364715576171875, 0.39404296875, 0.423370361328125, 0.45269775390625, 0.482025146484375, 0.5113525390625, 0.540679931640625, 0.57000732421875, 0.599334716796875, 0.628662109375, 0.657989501953125, 0.68731689453125, 0.716644287109375, 0.7459716796875, 0.775299072265625, 0.80462646484375, 0.833953857421875, 0.86328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 10.0, 9.0, 18.0, 16.0, 39.0, 38.0, 58.0, 75.0, 128.0, 217.0, 428.0, 1083.0, 3454.0, 15112.0, 89748.0, 626788.0, 259822.0, 40284.0, 7592.0, 2001.0, 743.0, 338.0, 184.0, 95.0, 86.0, 57.0, 35.0, 22.0, 15.0, 15.0, 14.0, 10.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.257110595703125, -2.18609619140625, -2.115081787109375, -2.0440673828125, -1.973052978515625, -1.90203857421875, -1.831024169921875, -1.760009765625, -1.688995361328125, -1.61798095703125, -1.546966552734375, -1.4759521484375, -1.404937744140625, -1.33392333984375, -1.262908935546875, -1.19189453125, -1.120880126953125, -1.04986572265625, -0.978851318359375, -0.9078369140625, -0.836822509765625, -0.76580810546875, -0.694793701171875, -0.623779296875, -0.552764892578125, -0.48175048828125, -0.410736083984375, -0.3397216796875, -0.268707275390625, -0.19769287109375, -0.126678466796875, -0.0556640625, 0.015350341796875, 0.08636474609375, 0.157379150390625, 0.2283935546875, 0.299407958984375, 0.37042236328125, 0.441436767578125, 0.512451171875, 0.583465576171875, 0.65447998046875, 0.725494384765625, 0.7965087890625, 0.867523193359375, 0.93853759765625, 1.009552001953125, 1.08056640625, 1.151580810546875, 1.22259521484375, 1.293609619140625, 1.3646240234375, 1.435638427734375, 1.50665283203125, 1.577667236328125, 1.648681640625, 1.719696044921875, 1.79071044921875, 1.861724853515625, 1.9327392578125, 2.003753662109375, 2.07476806640625, 2.145782470703125, 2.216796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 12.0, 13.0, 18.0, 20.0, 15.0, 25.0, 25.0, 34.0, 41.0, 32.0, 41.0, 55.0, 45.0, 54.0, 52.0, 60.0, 51.0, 49.0, 36.0, 43.0, 35.0, 39.0, 32.0, 19.0, 25.0, 22.0, 21.0, 12.0, 12.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0390625, -2.94879150390625, -2.8585205078125, -2.76824951171875, -2.677978515625, -2.58770751953125, -2.4974365234375, -2.40716552734375, -2.31689453125, -2.22662353515625, -2.1363525390625, -2.04608154296875, -1.955810546875, -1.86553955078125, -1.7752685546875, -1.68499755859375, -1.5947265625, -1.50445556640625, -1.4141845703125, -1.32391357421875, -1.233642578125, -1.14337158203125, -1.0531005859375, -0.96282958984375, -0.87255859375, -0.78228759765625, -0.6920166015625, -0.60174560546875, -0.511474609375, -0.42120361328125, -0.3309326171875, -0.24066162109375, -0.150390625, -0.06011962890625, 0.0301513671875, 0.12042236328125, 0.210693359375, 0.30096435546875, 0.3912353515625, 0.48150634765625, 0.57177734375, 0.66204833984375, 0.7523193359375, 0.84259033203125, 0.932861328125, 1.02313232421875, 1.1134033203125, 1.20367431640625, 1.2939453125, 1.38421630859375, 1.4744873046875, 1.56475830078125, 1.655029296875, 1.74530029296875, 1.8355712890625, 1.92584228515625, 2.01611328125, 2.10638427734375, 2.1966552734375, 2.28692626953125, 2.377197265625, 2.46746826171875, 2.5577392578125, 2.64801025390625, 2.73828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 12.0, 23.0, 27.0, 33.0, 59.0, 115.0, 185.0, 365.0, 913.0, 2413.0, 7340.0, 27607.0, 130535.0, 620114.0, 201151.0, 42087.0, 10268.0, 3163.0, 1094.0, 495.0, 226.0, 120.0, 60.0, 44.0, 31.0, 15.0, 15.0, 4.0, 11.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57470703125, -0.557098388671875, -0.53948974609375, -0.521881103515625, -0.5042724609375, -0.486663818359375, -0.46905517578125, -0.451446533203125, -0.433837890625, -0.416229248046875, -0.39862060546875, -0.381011962890625, -0.3634033203125, -0.345794677734375, -0.32818603515625, -0.310577392578125, -0.29296875, -0.275360107421875, -0.25775146484375, -0.240142822265625, -0.2225341796875, -0.204925537109375, -0.18731689453125, -0.169708251953125, -0.152099609375, -0.134490966796875, -0.11688232421875, -0.099273681640625, -0.0816650390625, -0.064056396484375, -0.04644775390625, -0.028839111328125, -0.01123046875, 0.006378173828125, 0.02398681640625, 0.041595458984375, 0.0592041015625, 0.076812744140625, 0.09442138671875, 0.112030029296875, 0.129638671875, 0.147247314453125, 0.16485595703125, 0.182464599609375, 0.2000732421875, 0.217681884765625, 0.23529052734375, 0.252899169921875, 0.2705078125, 0.288116455078125, 0.30572509765625, 0.323333740234375, 0.3409423828125, 0.358551025390625, 0.37615966796875, 0.393768310546875, 0.411376953125, 0.428985595703125, 0.44659423828125, 0.464202880859375, 0.4818115234375, 0.499420166015625, 0.51702880859375, 0.534637451171875, 0.55224609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 10.0, 10.0, 10.0, 11.0, 23.0, 31.0, 35.0, 50.0, 65.0, 61.0, 82.0, 81.0, 95.0, 94.0, 78.0, 52.0, 42.0, 31.0, 24.0, 24.0, 20.0, 13.0, 10.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00017845630645751953, -0.0001732315868139267, -0.00016800686717033386, -0.00016278214752674103, -0.0001575574278831482, -0.00015233270823955536, -0.00014710798859596252, -0.0001418832689523697, -0.00013665854930877686, -0.00013143382966518402, -0.0001262091100215912, -0.00012098439037799835, -0.00011575967073440552, -0.00011053495109081268, -0.00010531023144721985, -0.00010008551180362701, -9.486079216003418e-05, -8.963607251644135e-05, -8.441135287284851e-05, -7.918663322925568e-05, -7.396191358566284e-05, -6.873719394207001e-05, -6.351247429847717e-05, -5.828775465488434e-05, -5.3063035011291504e-05, -4.783831536769867e-05, -4.2613595724105835e-05, -3.7388876080513e-05, -3.2164156436920166e-05, -2.693943679332733e-05, -2.1714717149734497e-05, -1.6489997506141663e-05, -1.1265277862548828e-05, -6.040558218955994e-06, -8.158385753631592e-07, 4.408881068229675e-06, 9.63360071182251e-06, 1.4858320355415344e-05, 2.008303999900818e-05, 2.5307759642601013e-05, 3.053247928619385e-05, 3.575719892978668e-05, 4.0981918573379517e-05, 4.620663821697235e-05, 5.1431357860565186e-05, 5.665607750415802e-05, 6.188079714775085e-05, 6.710551679134369e-05, 7.233023643493652e-05, 7.755495607852936e-05, 8.277967572212219e-05, 8.800439536571503e-05, 9.322911500930786e-05, 9.84538346529007e-05, 0.00010367855429649353, 0.00010890327394008636, 0.0001141279935836792, 0.00011935271322727203, 0.00012457743287086487, 0.0001298021525144577, 0.00013502687215805054, 0.00014025159180164337, 0.0001454763114452362, 0.00015070103108882904, 0.00015592575073242188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 17.0, 25.0, 15.0, 63.0, 104.0, 184.0, 418.0, 1155.0, 3856.0, 19141.0, 149111.0, 718847.0, 132845.0, 17342.0, 3495.0, 1074.0, 408.0, 201.0, 74.0, 62.0, 30.0, 23.0, 15.0, 10.0, 6.0, 10.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5849838256835938, -0.5610809326171875, -0.5371780395507812, -0.513275146484375, -0.48937225341796875, -0.4654693603515625, -0.44156646728515625, -0.41766357421875, -0.39376068115234375, -0.3698577880859375, -0.34595489501953125, -0.322052001953125, -0.29814910888671875, -0.2742462158203125, -0.25034332275390625, -0.2264404296875, -0.20253753662109375, -0.1786346435546875, -0.15473175048828125, -0.130828857421875, -0.10692596435546875, -0.0830230712890625, -0.05912017822265625, -0.03521728515625, -0.01131439208984375, 0.0125885009765625, 0.03649139404296875, 0.060394287109375, 0.08429718017578125, 0.1082000732421875, 0.13210296630859375, 0.156005859375, 0.17990875244140625, 0.2038116455078125, 0.22771453857421875, 0.251617431640625, 0.27552032470703125, 0.2994232177734375, 0.32332611083984375, 0.34722900390625, 0.37113189697265625, 0.3950347900390625, 0.41893768310546875, 0.442840576171875, 0.46674346923828125, 0.4906463623046875, 0.5145492553710938, 0.5384521484375, 0.5623550415039062, 0.5862579345703125, 0.6101608276367188, 0.634063720703125, 0.6579666137695312, 0.6818695068359375, 0.7057723999023438, 0.72967529296875, 0.7535781860351562, 0.7774810791015625, 0.8013839721679688, 0.825286865234375, 0.8491897583007812, 0.8730926513671875, 0.8969955444335938, 0.9208984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 1.0, 12.0, 11.0, 10.0, 12.0, 19.0, 24.0, 23.0, 29.0, 38.0, 57.0, 55.0, 59.0, 71.0, 71.0, 67.0, 82.0, 46.0, 50.0, 62.0, 47.0, 34.0, 17.0, 20.0, 19.0, 15.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47998046875, -0.46233367919921875, -0.4446868896484375, -0.42704010009765625, -0.409393310546875, -0.39174652099609375, -0.3740997314453125, -0.35645294189453125, -0.33880615234375, -0.32115936279296875, -0.3035125732421875, -0.28586578369140625, -0.268218994140625, -0.25057220458984375, -0.2329254150390625, -0.21527862548828125, -0.1976318359375, -0.17998504638671875, -0.1623382568359375, -0.14469146728515625, -0.127044677734375, -0.10939788818359375, -0.0917510986328125, -0.07410430908203125, -0.05645751953125, -0.03881072998046875, -0.0211639404296875, -0.00351715087890625, 0.014129638671875, 0.03177642822265625, 0.0494232177734375, 0.06707000732421875, 0.084716796875, 0.10236358642578125, 0.1200103759765625, 0.13765716552734375, 0.155303955078125, 0.17295074462890625, 0.1905975341796875, 0.20824432373046875, 0.22589111328125, 0.24353790283203125, 0.2611846923828125, 0.27883148193359375, 0.296478271484375, 0.31412506103515625, 0.3317718505859375, 0.34941864013671875, 0.3670654296875, 0.38471221923828125, 0.4023590087890625, 0.42000579833984375, 0.437652587890625, 0.45529937744140625, 0.4729461669921875, 0.49059295654296875, 0.50823974609375, 0.5258865356445312, 0.5435333251953125, 0.5611801147460938, 0.578826904296875, 0.5964736938476562, 0.6141204833984375, 0.6317672729492188, 0.6494140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 4.0, 6.0, 23.0, 29.0, 82.0, 152.0, 238.0, 221.0, 123.0, 57.0, 20.0, 11.0, 5.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-25.959287643432617, -25.39434242248535, -24.829397201538086, -24.26445198059082, -23.699506759643555, -23.13456153869629, -22.569616317749023, -22.004671096801758, -21.439725875854492, -20.874780654907227, -20.30983543395996, -19.744890213012695, -19.17994499206543, -18.614999771118164, -18.0500545501709, -17.485109329223633, -16.920166015625, -16.355220794677734, -15.790275573730469, -15.225330352783203, -14.660385131835938, -14.095439910888672, -13.530494689941406, -12.96554946899414, -12.400604248046875, -11.83565902709961, -11.270713806152344, -10.705768585205078, -10.140823364257812, -9.575878143310547, -9.010932922363281, -8.445987701416016, -7.881043434143066, -7.316098213195801, -6.751152992248535, -6.1862077713012695, -5.621262550354004, -5.056317329406738, -4.491372585296631, -3.9264273643493652, -3.3614821434020996, -2.796536922454834, -2.2315917015075684, -1.6666467189788818, -1.1017014980316162, -0.5367562770843506, 0.028188705444335938, 0.5931339263916016, 1.1580791473388672, 1.7230243682861328, 2.2879695892333984, 2.852914571762085, 3.4178597927093506, 3.982805013656616, 4.547749996185303, 5.112695217132568, 5.677640438079834, 6.2425856590271, 6.807530879974365, 7.372475624084473, 7.937420845031738, 8.502366065979004, 9.06731128692627, 9.632256507873535, 10.1972017288208]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 7.0, 4.0, 1.0, 5.0, 8.0, 9.0, 17.0, 11.0, 15.0, 19.0, 19.0, 13.0, 30.0, 23.0, 28.0, 35.0, 48.0, 50.0, 68.0, 65.0, 64.0, 65.0, 53.0, 31.0, 33.0, 34.0, 24.0, 31.0, 23.0, 21.0, 17.0, 23.0, 18.0, 16.0, 12.0, 14.0, 6.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.511778831481934, -9.186701774597168, -8.861624717712402, -8.536547660827637, -8.211470603942871, -7.8863935470581055, -7.561316013336182, -7.236238956451416, -6.91116189956665, -6.586084842681885, -6.261007785797119, -5.9359307289123535, -5.61085319519043, -5.285776138305664, -4.960699081420898, -4.635622024536133, -4.310544967651367, -3.9854679107666016, -3.660390853881836, -3.335313558578491, -3.0102365016937256, -2.68515944480896, -2.3600821495056152, -2.0350050926208496, -1.709928035736084, -1.3848509788513184, -1.0597738027572632, -0.7346966862678528, -0.4096195697784424, -0.08454251289367676, 0.24053466320037842, 0.5656118392944336, 0.8906879425048828, 1.2157649993896484, 1.5408421754837036, 1.8659193515777588, 2.1909964084625244, 2.51607346534729, 2.8411507606506348, 3.1662278175354004, 3.491304874420166, 3.8163819313049316, 4.141458988189697, 4.466536045074463, 4.791613578796387, 5.116690635681152, 5.441767692565918, 5.766844749450684, 6.091921806335449, 6.416998863220215, 6.7420759201049805, 7.067152976989746, 7.392230033874512, 7.717307090759277, 8.042384147644043, 8.367462158203125, 8.69253921508789, 9.017616271972656, 9.342693328857422, 9.667770385742188, 9.992847442626953, 10.317924499511719, 10.643001556396484, 10.96807861328125, 11.293155670166016]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 19.0, 24.0, 25.0, 53.0, 97.0, 135.0, 228.0, 447.0, 803.0, 1634.0, 3162.0, 7332.0, 19006.0, 53564.0, 170576.0, 543762.0, 1378455.0, 1297000.0, 485051.0, 152190.0, 48621.0, 17743.0, 7332.0, 3466.0, 1650.0, 801.0, 442.0, 272.0, 147.0, 77.0, 56.0, 31.0, 20.0, 19.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.4883880615234375, -0.470916748046875, -0.4534454345703125, -0.43597412109375, -0.4185028076171875, -0.401031494140625, -0.3835601806640625, -0.3660888671875, -0.3486175537109375, -0.331146240234375, -0.3136749267578125, -0.29620361328125, -0.2787322998046875, -0.261260986328125, -0.2437896728515625, -0.226318359375, -0.2088470458984375, -0.191375732421875, -0.1739044189453125, -0.15643310546875, -0.1389617919921875, -0.121490478515625, -0.1040191650390625, -0.0865478515625, -0.0690765380859375, -0.051605224609375, -0.0341339111328125, -0.01666259765625, 0.0008087158203125, 0.018280029296875, 0.0357513427734375, 0.05322265625, 0.0706939697265625, 0.088165283203125, 0.1056365966796875, 0.12310791015625, 0.1405792236328125, 0.158050537109375, 0.1755218505859375, 0.1929931640625, 0.2104644775390625, 0.227935791015625, 0.2454071044921875, 0.26287841796875, 0.2803497314453125, 0.297821044921875, 0.3152923583984375, 0.332763671875, 0.3502349853515625, 0.367706298828125, 0.3851776123046875, 0.40264892578125, 0.4201202392578125, 0.437591552734375, 0.4550628662109375, 0.4725341796875, 0.4900054931640625, 0.507476806640625, 0.5249481201171875, 0.54241943359375, 0.5598907470703125, 0.577362060546875, 0.5948333740234375, 0.6123046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 8.0, 12.0, 9.0, 14.0, 17.0, 14.0, 20.0, 22.0, 28.0, 35.0, 37.0, 47.0, 46.0, 55.0, 45.0, 53.0, 52.0, 61.0, 52.0, 50.0, 40.0, 47.0, 34.0, 26.0, 33.0, 22.0, 27.0, 22.0, 14.0, 14.0, 12.0, 8.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.96484375, -0.9368820190429688, -0.9089202880859375, -0.8809585571289062, -0.852996826171875, -0.8250350952148438, -0.7970733642578125, -0.7691116333007812, -0.74114990234375, -0.7131881713867188, -0.6852264404296875, -0.6572647094726562, -0.629302978515625, -0.6013412475585938, -0.5733795166015625, -0.5454177856445312, -0.5174560546875, -0.48949432373046875, -0.4615325927734375, -0.43357086181640625, -0.405609130859375, -0.37764739990234375, -0.3496856689453125, -0.32172393798828125, -0.29376220703125, -0.26580047607421875, -0.2378387451171875, -0.20987701416015625, -0.181915283203125, -0.15395355224609375, -0.1259918212890625, -0.09803009033203125, -0.070068359375, -0.04210662841796875, -0.0141448974609375, 0.01381683349609375, 0.041778564453125, 0.06974029541015625, 0.0977020263671875, 0.12566375732421875, 0.15362548828125, 0.18158721923828125, 0.2095489501953125, 0.23751068115234375, 0.265472412109375, 0.29343414306640625, 0.3213958740234375, 0.34935760498046875, 0.3773193359375, 0.40528106689453125, 0.4332427978515625, 0.46120452880859375, 0.489166259765625, 0.5171279907226562, 0.5450897216796875, 0.5730514526367188, 0.60101318359375, 0.6289749145507812, 0.6569366455078125, 0.6848983764648438, 0.712860107421875, 0.7408218383789062, 0.7687835693359375, 0.7967453002929688, 0.82470703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 9.0, 19.0, 24.0, 23.0, 67.0, 121.0, 305.0, 893.0, 3611.0, 26262.0, 1118193.0, 2988474.0, 48750.0, 5562.0, 1213.0, 391.0, 142.0, 79.0, 44.0, 24.0, 16.0, 15.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.164459228515625, -2.09259033203125, -2.020721435546875, -1.9488525390625, -1.876983642578125, -1.80511474609375, -1.733245849609375, -1.661376953125, -1.589508056640625, -1.51763916015625, -1.445770263671875, -1.3739013671875, -1.302032470703125, -1.23016357421875, -1.158294677734375, -1.08642578125, -1.014556884765625, -0.94268798828125, -0.870819091796875, -0.7989501953125, -0.727081298828125, -0.65521240234375, -0.583343505859375, -0.511474609375, -0.439605712890625, -0.36773681640625, -0.295867919921875, -0.2239990234375, -0.152130126953125, -0.08026123046875, -0.008392333984375, 0.0634765625, 0.135345458984375, 0.20721435546875, 0.279083251953125, 0.3509521484375, 0.422821044921875, 0.49468994140625, 0.566558837890625, 0.638427734375, 0.710296630859375, 0.78216552734375, 0.854034423828125, 0.9259033203125, 0.997772216796875, 1.06964111328125, 1.141510009765625, 1.21337890625, 1.285247802734375, 1.35711669921875, 1.428985595703125, 1.5008544921875, 1.572723388671875, 1.64459228515625, 1.716461181640625, 1.788330078125, 1.860198974609375, 1.93206787109375, 2.003936767578125, 2.0758056640625, 2.147674560546875, 2.21954345703125, 2.291412353515625, 2.36328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 2.0, 6.0, 7.0, 17.0, 17.0, 29.0, 39.0, 64.0, 74.0, 116.0, 174.0, 272.0, 369.0, 480.0, 539.0, 497.0, 414.0, 277.0, 209.0, 134.0, 81.0, 62.0, 41.0, 30.0, 17.0, 18.0, 14.0, 6.0, 8.0, 13.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2529296875, -1.213226318359375, -1.17352294921875, -1.133819580078125, -1.0941162109375, -1.054412841796875, -1.01470947265625, -0.975006103515625, -0.935302734375, -0.895599365234375, -0.85589599609375, -0.816192626953125, -0.7764892578125, -0.736785888671875, -0.69708251953125, -0.657379150390625, -0.61767578125, -0.577972412109375, -0.53826904296875, -0.498565673828125, -0.4588623046875, -0.419158935546875, -0.37945556640625, -0.339752197265625, -0.300048828125, -0.260345458984375, -0.22064208984375, -0.180938720703125, -0.1412353515625, -0.101531982421875, -0.06182861328125, -0.022125244140625, 0.017578125, 0.057281494140625, 0.09698486328125, 0.136688232421875, 0.1763916015625, 0.216094970703125, 0.25579833984375, 0.295501708984375, 0.335205078125, 0.374908447265625, 0.41461181640625, 0.454315185546875, 0.4940185546875, 0.533721923828125, 0.57342529296875, 0.613128662109375, 0.65283203125, 0.692535400390625, 0.73223876953125, 0.771942138671875, 0.8116455078125, 0.851348876953125, 0.89105224609375, 0.930755615234375, 0.970458984375, 1.010162353515625, 1.04986572265625, 1.089569091796875, 1.1292724609375, 1.168975830078125, 1.20867919921875, 1.248382568359375, 1.2880859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 13.0, 22.0, 33.0, 84.0, 125.0, 180.0, 187.0, 146.0, 86.0, 46.0, 22.0, 19.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.760187149047852, -10.333600997924805, -9.907015800476074, -9.480429649353027, -9.05384349822998, -8.62725830078125, -8.200672149658203, -7.774085998535156, -7.347500324249268, -6.920914649963379, -6.494328498840332, -6.067742824554443, -5.641157150268555, -5.214570999145508, -4.787985324859619, -4.3613996505737305, -3.9348134994506836, -3.508227586746216, -3.081641674041748, -2.6550559997558594, -2.2284700870513916, -1.8018841743469238, -1.3752985000610352, -0.9487125873565674, -0.5221266746520996, -0.09554082155227661, 0.3310450315475464, 0.7576308250427246, 1.1842167377471924, 1.6108026504516602, 2.037388324737549, 2.4639742374420166, 2.8905601501464844, 3.317146062850952, 3.74373197555542, 4.170317649841309, 4.5969038009643555, 5.023489475250244, 5.450075149536133, 5.87666130065918, 6.303246974945068, 6.729832649230957, 7.156418800354004, 7.583004474639893, 8.009590148925781, 8.436176300048828, 8.862762451171875, 9.289347648620605, 9.715933799743652, 10.1425199508667, 10.56910514831543, 10.995691299438477, 11.422277450561523, 11.84886360168457, 12.2754487991333, 12.702034950256348, 13.128620147705078, 13.555206298828125, 13.981791496276855, 14.408377647399902, 14.83496379852295, 15.26154899597168, 15.688135147094727, 16.114721298217773, 16.54130744934082]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 9.0, 20.0, 11.0, 13.0, 15.0, 36.0, 21.0, 36.0, 39.0, 54.0, 47.0, 41.0, 45.0, 39.0, 54.0, 61.0, 36.0, 34.0, 50.0, 45.0, 42.0, 41.0, 26.0, 20.0, 33.0, 20.0, 15.0, 20.0, 12.0, 12.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.060419082641602, -5.824182987213135, -5.58794641494751, -5.351710319519043, -5.115473747253418, -4.879237651824951, -4.643001556396484, -4.406764984130859, -4.170528888702393, -3.9342925548553467, -3.698056221008301, -3.461820125579834, -3.225583791732788, -2.989347457885742, -2.7531113624572754, -2.5168750286102295, -2.2806386947631836, -2.0444023609161377, -1.8081661462783813, -1.571929931640625, -1.335693597793579, -1.0994572639465332, -0.8632210493087769, -0.6269848346710205, -0.3907485008239746, -0.1545122265815735, 0.08172404766082764, 0.31796032190322876, 0.5541965961456299, 0.7904329299926758, 1.0266691446304321, 1.2629053592681885, 1.4991416931152344, 1.7353780269622803, 1.9716142416000366, 2.207850456237793, 2.444086790084839, 2.6803231239318848, 2.9165592193603516, 3.1527955532073975, 3.3890318870544434, 3.6252682209014893, 3.861504554748535, 4.097740650177002, 4.333976745605469, 4.570213317871094, 4.8064494132995605, 5.042685508728027, 5.278922080993652, 5.515158176422119, 5.751394748687744, 5.987630844116211, 6.223867416381836, 6.460103511810303, 6.6963396072387695, 6.9325761795043945, 7.168812274932861, 7.405048370361328, 7.641284942626953, 7.87752103805542, 8.113757133483887, 8.349993705749512, 8.586230278015137, 8.822465896606445, 9.05870246887207]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 10.0, 10.0, 29.0, 46.0, 60.0, 73.0, 124.0, 169.0, 240.0, 433.0, 617.0, 1035.0, 1843.0, 3038.0, 5518.0, 10755.0, 20852.0, 41717.0, 83479.0, 159600.0, 244352.0, 217691.0, 125873.0, 63769.0, 31999.0, 16073.0, 8327.0, 4483.0, 2490.0, 1396.0, 890.0, 546.0, 327.0, 220.0, 135.0, 104.0, 56.0, 56.0, 31.0, 19.0, 13.0, 13.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76953125, -0.7445526123046875, -0.719573974609375, -0.6945953369140625, -0.66961669921875, -0.6446380615234375, -0.619659423828125, -0.5946807861328125, -0.5697021484375, -0.5447235107421875, -0.519744873046875, -0.4947662353515625, -0.46978759765625, -0.4448089599609375, -0.419830322265625, -0.3948516845703125, -0.369873046875, -0.3448944091796875, -0.319915771484375, -0.2949371337890625, -0.26995849609375, -0.2449798583984375, -0.220001220703125, -0.1950225830078125, -0.1700439453125, -0.1450653076171875, -0.120086669921875, -0.0951080322265625, -0.07012939453125, -0.0451507568359375, -0.020172119140625, 0.0048065185546875, 0.02978515625, 0.0547637939453125, 0.079742431640625, 0.1047210693359375, 0.12969970703125, 0.1546783447265625, 0.179656982421875, 0.2046356201171875, 0.2296142578125, 0.2545928955078125, 0.279571533203125, 0.3045501708984375, 0.32952880859375, 0.3545074462890625, 0.379486083984375, 0.4044647216796875, 0.429443359375, 0.4544219970703125, 0.479400634765625, 0.5043792724609375, 0.52935791015625, 0.5543365478515625, 0.579315185546875, 0.6042938232421875, 0.6292724609375, 0.6542510986328125, 0.679229736328125, 0.7042083740234375, 0.72918701171875, 0.7541656494140625, 0.779144287109375, 0.8041229248046875, 0.8291015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 7.0, 13.0, 18.0, 19.0, 25.0, 24.0, 31.0, 33.0, 33.0, 42.0, 45.0, 41.0, 59.0, 58.0, 50.0, 59.0, 52.0, 41.0, 43.0, 52.0, 38.0, 37.0, 27.0, 26.0, 21.0, 24.0, 13.0, 6.0, 11.0, 7.0, 7.0, 5.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0009765625, -0.9727554321289062, -0.9445343017578125, -0.9163131713867188, -0.888092041015625, -0.8598709106445312, -0.8316497802734375, -0.8034286499023438, -0.77520751953125, -0.7469863891601562, -0.7187652587890625, -0.6905441284179688, -0.662322998046875, -0.6341018676757812, -0.6058807373046875, -0.5776596069335938, -0.5494384765625, -0.5212173461914062, -0.4929962158203125, -0.46477508544921875, -0.436553955078125, -0.40833282470703125, -0.3801116943359375, -0.35189056396484375, -0.32366943359375, -0.29544830322265625, -0.2672271728515625, -0.23900604248046875, -0.210784912109375, -0.18256378173828125, -0.1543426513671875, -0.12612152099609375, -0.097900390625, -0.06967926025390625, -0.0414581298828125, -0.01323699951171875, 0.014984130859375, 0.04320526123046875, 0.0714263916015625, 0.09964752197265625, 0.12786865234375, 0.15608978271484375, 0.1843109130859375, 0.21253204345703125, 0.240753173828125, 0.26897430419921875, 0.2971954345703125, 0.32541656494140625, 0.3536376953125, 0.38185882568359375, 0.4100799560546875, 0.43830108642578125, 0.466522216796875, 0.49474334716796875, 0.5229644775390625, 0.5511856079101562, 0.57940673828125, 0.6076278686523438, 0.6358489990234375, 0.6640701293945312, 0.692291259765625, 0.7205123901367188, 0.7487335205078125, 0.7769546508789062, 0.80517578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 14.0, 6.0, 25.0, 22.0, 32.0, 37.0, 52.0, 60.0, 77.0, 120.0, 182.0, 251.0, 357.0, 573.0, 1008.0, 1917.0, 5098.0, 16786.0, 71799.0, 439197.0, 412825.0, 71463.0, 16759.0, 4950.0, 1994.0, 943.0, 577.0, 384.0, 273.0, 160.0, 150.0, 105.0, 76.0, 55.0, 39.0, 43.0, 27.0, 32.0, 18.0, 19.0, 13.0, 4.0, 6.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.6162109375, -1.5640716552734375, -1.511932373046875, -1.4597930908203125, -1.40765380859375, -1.3555145263671875, -1.303375244140625, -1.2512359619140625, -1.1990966796875, -1.1469573974609375, -1.094818115234375, -1.0426788330078125, -0.99053955078125, -0.9384002685546875, -0.886260986328125, -0.8341217041015625, -0.781982421875, -0.7298431396484375, -0.677703857421875, -0.6255645751953125, -0.57342529296875, -0.5212860107421875, -0.469146728515625, -0.4170074462890625, -0.3648681640625, -0.3127288818359375, -0.260589599609375, -0.2084503173828125, -0.15631103515625, -0.1041717529296875, -0.052032470703125, 0.0001068115234375, 0.05224609375, 0.1043853759765625, 0.156524658203125, 0.2086639404296875, 0.26080322265625, 0.3129425048828125, 0.365081787109375, 0.4172210693359375, 0.4693603515625, 0.5214996337890625, 0.573638916015625, 0.6257781982421875, 0.67791748046875, 0.7300567626953125, 0.782196044921875, 0.8343353271484375, 0.886474609375, 0.9386138916015625, 0.990753173828125, 1.0428924560546875, 1.09503173828125, 1.1471710205078125, 1.199310302734375, 1.2514495849609375, 1.3035888671875, 1.3557281494140625, 1.407867431640625, 1.4600067138671875, 1.51214599609375, 1.5642852783203125, 1.616424560546875, 1.6685638427734375, 1.720703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 14.0, 16.0, 10.0, 14.0, 19.0, 26.0, 29.0, 48.0, 34.0, 46.0, 38.0, 46.0, 47.0, 58.0, 58.0, 35.0, 55.0, 45.0, 46.0, 34.0, 40.0, 34.0, 35.0, 21.0, 26.0, 19.0, 10.0, 11.0, 11.0, 12.0, 14.0, 9.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.6295166015625, -2.540283203125, -2.4510498046875, -2.36181640625, -2.2725830078125, -2.183349609375, -2.0941162109375, -2.0048828125, -1.9156494140625, -1.826416015625, -1.7371826171875, -1.64794921875, -1.5587158203125, -1.469482421875, -1.3802490234375, -1.291015625, -1.2017822265625, -1.112548828125, -1.0233154296875, -0.93408203125, -0.8448486328125, -0.755615234375, -0.6663818359375, -0.5771484375, -0.4879150390625, -0.398681640625, -0.3094482421875, -0.22021484375, -0.1309814453125, -0.041748046875, 0.0474853515625, 0.13671875, 0.2259521484375, 0.315185546875, 0.4044189453125, 0.49365234375, 0.5828857421875, 0.672119140625, 0.7613525390625, 0.8505859375, 0.9398193359375, 1.029052734375, 1.1182861328125, 1.20751953125, 1.2967529296875, 1.385986328125, 1.4752197265625, 1.564453125, 1.6536865234375, 1.742919921875, 1.8321533203125, 1.92138671875, 2.0106201171875, 2.099853515625, 2.1890869140625, 2.2783203125, 2.3675537109375, 2.456787109375, 2.5460205078125, 2.63525390625, 2.7244873046875, 2.813720703125, 2.9029541015625, 2.9921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 8.0, 11.0, 11.0, 16.0, 25.0, 38.0, 46.0, 51.0, 82.0, 167.0, 259.0, 444.0, 929.0, 1916.0, 4834.0, 13566.0, 44427.0, 174811.0, 628148.0, 126864.0, 33769.0, 10707.0, 3905.0, 1652.0, 757.0, 435.0, 242.0, 133.0, 76.0, 67.0, 48.0, 25.0, 18.0, 10.0, 13.0, 3.0, 9.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4221000671386719, -0.40865325927734375, -0.3952064514160156, -0.3817596435546875, -0.3683128356933594, -0.35486602783203125, -0.3414192199707031, -0.327972412109375, -0.3145256042480469, -0.30107879638671875, -0.2876319885253906, -0.2741851806640625, -0.2607383728027344, -0.24729156494140625, -0.23384475708007812, -0.22039794921875, -0.20695114135742188, -0.19350433349609375, -0.18005752563476562, -0.1666107177734375, -0.15316390991210938, -0.13971710205078125, -0.12627029418945312, -0.112823486328125, -0.09937667846679688, -0.08592987060546875, -0.07248306274414062, -0.0590362548828125, -0.045589447021484375, -0.03214263916015625, -0.018695831298828125, -0.0052490234375, 0.008197784423828125, 0.02164459228515625, 0.035091400146484375, 0.0485382080078125, 0.061985015869140625, 0.07543182373046875, 0.08887863159179688, 0.102325439453125, 0.11577224731445312, 0.12921905517578125, 0.14266586303710938, 0.1561126708984375, 0.16955947875976562, 0.18300628662109375, 0.19645309448242188, 0.20989990234375, 0.22334671020507812, 0.23679351806640625, 0.2502403259277344, 0.2636871337890625, 0.2771339416503906, 0.29058074951171875, 0.3040275573730469, 0.317474365234375, 0.3309211730957031, 0.34436798095703125, 0.3578147888183594, 0.3712615966796875, 0.3847084045410156, 0.39815521240234375, 0.4116020202636719, 0.425048828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 8.0, 9.0, 16.0, 16.0, 23.0, 48.0, 71.0, 89.0, 125.0, 135.0, 119.0, 100.0, 67.0, 44.0, 29.0, 26.0, 23.0, 15.0, 6.0, 4.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023281574249267578, -0.00022627972066402435, -0.00021974369883537292, -0.0002132076770067215, -0.00020667165517807007, -0.00020013563334941864, -0.0001935996115207672, -0.00018706358969211578, -0.00018052756786346436, -0.00017399154603481293, -0.0001674555242061615, -0.00016091950237751007, -0.00015438348054885864, -0.00014784745872020721, -0.00014131143689155579, -0.00013477541506290436, -0.00012823939323425293, -0.0001217033714056015, -0.00011516734957695007, -0.00010863132774829865, -0.00010209530591964722, -9.555928409099579e-05, -8.902326226234436e-05, -8.248724043369293e-05, -7.59512186050415e-05, -6.941519677639008e-05, -6.287917494773865e-05, -5.634315311908722e-05, -4.980713129043579e-05, -4.327110946178436e-05, -3.6735087633132935e-05, -3.0199065804481506e-05, -2.3663043975830078e-05, -1.712702214717865e-05, -1.0591000318527222e-05, -4.0549784898757935e-06, 2.4810433387756348e-06, 9.017065167427063e-06, 1.555308699607849e-05, 2.208910882472992e-05, 2.8625130653381348e-05, 3.5161152482032776e-05, 4.1697174310684204e-05, 4.823319613933563e-05, 5.476921796798706e-05, 6.130523979663849e-05, 6.784126162528992e-05, 7.437728345394135e-05, 8.091330528259277e-05, 8.74493271112442e-05, 9.398534893989563e-05, 0.00010052137076854706, 0.00010705739259719849, 0.00011359341442584991, 0.00012012943625450134, 0.00012666545808315277, 0.0001332014799118042, 0.00013973750174045563, 0.00014627352356910706, 0.00015280954539775848, 0.0001593455672264099, 0.00016588158905506134, 0.00017241761088371277, 0.0001789536327123642, 0.00018548965454101562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 13.0, 17.0, 21.0, 30.0, 57.0, 113.0, 177.0, 316.0, 620.0, 1553.0, 4644.0, 19043.0, 118800.0, 740728.0, 133734.0, 20729.0, 4984.0, 1585.0, 672.0, 296.0, 175.0, 92.0, 56.0, 34.0, 12.0, 14.0, 8.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.72265625, -0.7038993835449219, -0.6851425170898438, -0.6663856506347656, -0.6476287841796875, -0.6288719177246094, -0.6101150512695312, -0.5913581848144531, -0.572601318359375, -0.5538444519042969, -0.5350875854492188, -0.5163307189941406, -0.4975738525390625, -0.4788169860839844, -0.46006011962890625, -0.4413032531738281, -0.42254638671875, -0.4037895202636719, -0.38503265380859375, -0.3662757873535156, -0.3475189208984375, -0.3287620544433594, -0.31000518798828125, -0.2912483215332031, -0.272491455078125, -0.2537345886230469, -0.23497772216796875, -0.21622085571289062, -0.1974639892578125, -0.17870712280273438, -0.15995025634765625, -0.14119338989257812, -0.1224365234375, -0.10367965698242188, -0.08492279052734375, -0.06616592407226562, -0.0474090576171875, -0.028652191162109375, -0.00989532470703125, 0.008861541748046875, 0.027618408203125, 0.046375274658203125, 0.06513214111328125, 0.08388900756835938, 0.1026458740234375, 0.12140274047851562, 0.14015960693359375, 0.15891647338867188, 0.17767333984375, 0.19643020629882812, 0.21518707275390625, 0.23394393920898438, 0.2527008056640625, 0.2714576721191406, 0.29021453857421875, 0.3089714050292969, 0.327728271484375, 0.3464851379394531, 0.36524200439453125, 0.3839988708496094, 0.4027557373046875, 0.4215126037597656, 0.44026947021484375, 0.4590263366699219, 0.477783203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 6.0, 1.0, 5.0, 11.0, 13.0, 20.0, 29.0, 34.0, 49.0, 82.0, 100.0, 102.0, 102.0, 119.0, 83.0, 77.0, 44.0, 34.0, 23.0, 19.0, 16.0, 12.0, 5.0, 5.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5746002197265625, -0.553009033203125, -0.5314178466796875, -0.50982666015625, -0.4882354736328125, -0.466644287109375, -0.4450531005859375, -0.4234619140625, -0.4018707275390625, -0.380279541015625, -0.3586883544921875, -0.33709716796875, -0.3155059814453125, -0.293914794921875, -0.2723236083984375, -0.250732421875, -0.2291412353515625, -0.207550048828125, -0.1859588623046875, -0.16436767578125, -0.1427764892578125, -0.121185302734375, -0.0995941162109375, -0.0780029296875, -0.0564117431640625, -0.034820556640625, -0.0132293701171875, 0.00836181640625, 0.0299530029296875, 0.051544189453125, 0.0731353759765625, 0.0947265625, 0.1163177490234375, 0.137908935546875, 0.1595001220703125, 0.18109130859375, 0.2026824951171875, 0.224273681640625, 0.2458648681640625, 0.2674560546875, 0.2890472412109375, 0.310638427734375, 0.3322296142578125, 0.35382080078125, 0.3754119873046875, 0.397003173828125, 0.4185943603515625, 0.440185546875, 0.4617767333984375, 0.483367919921875, 0.5049591064453125, 0.52655029296875, 0.5481414794921875, 0.569732666015625, 0.5913238525390625, 0.6129150390625, 0.6345062255859375, 0.656097412109375, 0.6776885986328125, 0.69927978515625, 0.7208709716796875, 0.742462158203125, 0.7640533447265625, 0.78564453125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 7.0, 16.0, 47.0, 63.0, 111.0, 190.0, 291.0, 123.0, 65.0, 36.0, 17.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.890586853027344, -19.39608383178711, -18.901580810546875, -18.40707778930664, -17.912574768066406, -17.418071746826172, -16.923568725585938, -16.429065704345703, -15.934563636779785, -15.44006061553955, -14.945557594299316, -14.451054573059082, -13.956552505493164, -13.46204948425293, -12.967546463012695, -12.473043441772461, -11.978540420532227, -11.484037399291992, -10.989534378051758, -10.495031356811523, -10.000528335571289, -9.506025314331055, -9.011523246765137, -8.517020225524902, -8.022517204284668, -7.528014183044434, -7.033511161804199, -6.539008617401123, -6.044505596160889, -5.550002574920654, -5.055500030517578, -4.560997009277344, -4.066493988037109, -3.571990966796875, -3.0774881839752197, -2.5829854011535645, -2.08848237991333, -1.5939793586730957, -1.0994765758514404, -0.6049737930297852, -0.11047077178955078, 0.38403213024139404, 0.8785350322723389, 1.3730379343032837, 1.8675408363342285, 2.362043857574463, 2.856546640396118, 3.3510494232177734, 3.845552444458008, 4.340055465698242, 4.834558486938477, 5.329061031341553, 5.823564052581787, 6.3180670738220215, 6.812569618225098, 7.307072639465332, 7.801575660705566, 8.2960786819458, 8.790581703186035, 9.28508472442627, 9.779586791992188, 10.274089813232422, 10.768592834472656, 11.26309585571289, 11.757598876953125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 6.0, 2.0, 10.0, 6.0, 12.0, 20.0, 14.0, 16.0, 19.0, 23.0, 18.0, 25.0, 26.0, 21.0, 41.0, 46.0, 46.0, 95.0, 115.0, 70.0, 49.0, 34.0, 35.0, 29.0, 31.0, 26.0, 29.0, 21.0, 19.0, 13.0, 10.0, 11.0, 10.0, 6.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.874667167663574, -9.539567947387695, -9.204469680786133, -8.86937141418457, -8.534272193908691, -8.199172973632812, -7.86407470703125, -7.528975963592529, -7.193877220153809, -6.858778476715088, -6.523679733276367, -6.1885809898376465, -5.853482246398926, -5.518383502960205, -5.183284759521484, -4.848186016082764, -4.513087272644043, -4.177988529205322, -3.8428897857666016, -3.507791042327881, -3.17269229888916, -2.8375935554504395, -2.5024948120117188, -2.167396068572998, -1.8322973251342773, -1.4971985816955566, -1.162099838256836, -0.8270010948181152, -0.49190235137939453, -0.15680360794067383, 0.17829513549804688, 0.5133938789367676, 0.8484916687011719, 1.1835904121398926, 1.5186891555786133, 1.853787899017334, 2.1888866424560547, 2.5239853858947754, 2.859084129333496, 3.194182872772217, 3.5292816162109375, 3.864380359649658, 4.199479103088379, 4.5345778465271, 4.86967658996582, 5.204775333404541, 5.539874076843262, 5.874972820281982, 6.210071563720703, 6.545170307159424, 6.8802690505981445, 7.215367794036865, 7.550466537475586, 7.885565280914307, 8.220664024353027, 8.555763244628906, 8.890861511230469, 9.225959777832031, 9.56105899810791, 9.896158218383789, 10.231256484985352, 10.566354751586914, 10.901453971862793, 11.236553192138672, 11.571651458740234]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 12.0, 21.0, 18.0, 25.0, 42.0, 60.0, 88.0, 153.0, 223.0, 380.0, 596.0, 1143.0, 2323.0, 5442.0, 14369.0, 42554.0, 144867.0, 488748.0, 1296868.0, 1409177.0, 549073.0, 161110.0, 48314.0, 16360.0, 6426.0, 2770.0, 1377.0, 691.0, 373.0, 221.0, 133.0, 99.0, 63.0, 52.0, 22.0, 24.0, 17.0, 13.0, 5.0, 6.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.65185546875, -0.6327133178710938, -0.6135711669921875, -0.5944290161132812, -0.575286865234375, -0.5561447143554688, -0.5370025634765625, -0.5178604125976562, -0.49871826171875, -0.47957611083984375, -0.4604339599609375, -0.44129180908203125, -0.422149658203125, -0.40300750732421875, -0.3838653564453125, -0.36472320556640625, -0.3455810546875, -0.32643890380859375, -0.3072967529296875, -0.28815460205078125, -0.269012451171875, -0.24987030029296875, -0.2307281494140625, -0.21158599853515625, -0.19244384765625, -0.17330169677734375, -0.1541595458984375, -0.13501739501953125, -0.115875244140625, -0.09673309326171875, -0.0775909423828125, -0.05844879150390625, -0.039306640625, -0.02016448974609375, -0.0010223388671875, 0.01811981201171875, 0.037261962890625, 0.05640411376953125, 0.0755462646484375, 0.09468841552734375, 0.11383056640625, 0.13297271728515625, 0.1521148681640625, 0.17125701904296875, 0.190399169921875, 0.20954132080078125, 0.2286834716796875, 0.24782562255859375, 0.2669677734375, 0.28610992431640625, 0.3052520751953125, 0.32439422607421875, 0.343536376953125, 0.36267852783203125, 0.3818206787109375, 0.40096282958984375, 0.42010498046875, 0.43924713134765625, 0.4583892822265625, 0.47753143310546875, 0.496673583984375, 0.5158157348632812, 0.5349578857421875, 0.5541000366210938, 0.5732421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 7.0, 6.0, 15.0, 10.0, 26.0, 17.0, 29.0, 28.0, 36.0, 36.0, 47.0, 37.0, 54.0, 45.0, 52.0, 57.0, 41.0, 48.0, 44.0, 52.0, 37.0, 30.0, 37.0, 35.0, 35.0, 26.0, 19.0, 15.0, 10.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.96484375, -0.9371109008789062, -0.9093780517578125, -0.8816452026367188, -0.853912353515625, -0.8261795043945312, -0.7984466552734375, -0.7707138061523438, -0.74298095703125, -0.7152481079101562, -0.6875152587890625, -0.6597824096679688, -0.632049560546875, -0.6043167114257812, -0.5765838623046875, -0.5488510131835938, -0.5211181640625, -0.49338531494140625, -0.4656524658203125, -0.43791961669921875, -0.410186767578125, -0.38245391845703125, -0.3547210693359375, -0.32698822021484375, -0.29925537109375, -0.27152252197265625, -0.2437896728515625, -0.21605682373046875, -0.188323974609375, -0.16059112548828125, -0.1328582763671875, -0.10512542724609375, -0.077392578125, -0.04965972900390625, -0.0219268798828125, 0.00580596923828125, 0.033538818359375, 0.06127166748046875, 0.0890045166015625, 0.11673736572265625, 0.14447021484375, 0.17220306396484375, 0.1999359130859375, 0.22766876220703125, 0.255401611328125, 0.28313446044921875, 0.3108673095703125, 0.33860015869140625, 0.3663330078125, 0.39406585693359375, 0.4217987060546875, 0.44953155517578125, 0.477264404296875, 0.5049972534179688, 0.5327301025390625, 0.5604629516601562, 0.58819580078125, 0.6159286499023438, 0.6436614990234375, 0.6713943481445312, 0.699127197265625, 0.7268600463867188, 0.7545928955078125, 0.7823257446289062, 0.81005859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 10.0, 22.0, 21.0, 18.0, 38.0, 84.0, 159.0, 279.0, 655.0, 2138.0, 12122.0, 157344.0, 3646417.0, 349956.0, 19916.0, 3219.0, 982.0, 398.0, 201.0, 107.0, 62.0, 35.0, 30.0, 17.0, 12.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9404296875, -1.8770294189453125, -1.813629150390625, -1.7502288818359375, -1.68682861328125, -1.6234283447265625, -1.560028076171875, -1.4966278076171875, -1.4332275390625, -1.3698272705078125, -1.306427001953125, -1.2430267333984375, -1.17962646484375, -1.1162261962890625, -1.052825927734375, -0.9894256591796875, -0.926025390625, -0.8626251220703125, -0.799224853515625, -0.7358245849609375, -0.67242431640625, -0.6090240478515625, -0.545623779296875, -0.4822235107421875, -0.4188232421875, -0.3554229736328125, -0.292022705078125, -0.2286224365234375, -0.16522216796875, -0.1018218994140625, -0.038421630859375, 0.0249786376953125, 0.08837890625, 0.1517791748046875, 0.215179443359375, 0.2785797119140625, 0.34197998046875, 0.4053802490234375, 0.468780517578125, 0.5321807861328125, 0.5955810546875, 0.6589813232421875, 0.722381591796875, 0.7857818603515625, 0.84918212890625, 0.9125823974609375, 0.975982666015625, 1.0393829345703125, 1.102783203125, 1.1661834716796875, 1.229583740234375, 1.2929840087890625, 1.35638427734375, 1.4197845458984375, 1.483184814453125, 1.5465850830078125, 1.6099853515625, 1.6733856201171875, 1.736785888671875, 1.8001861572265625, 1.86358642578125, 1.9269866943359375, 1.990386962890625, 2.0537872314453125, 2.1171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 5.0, 5.0, 14.0, 5.0, 9.0, 14.0, 21.0, 26.0, 39.0, 76.0, 105.0, 146.0, 210.0, 312.0, 416.0, 503.0, 515.0, 498.0, 333.0, 230.0, 163.0, 115.0, 61.0, 60.0, 40.0, 41.0, 30.0, 24.0, 16.0, 5.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8788375854492188, -0.8372650146484375, -0.7956924438476562, -0.754119873046875, -0.7125473022460938, -0.6709747314453125, -0.6294021606445312, -0.58782958984375, -0.5462570190429688, -0.5046844482421875, -0.46311187744140625, -0.421539306640625, -0.37996673583984375, -0.3383941650390625, -0.29682159423828125, -0.2552490234375, -0.21367645263671875, -0.1721038818359375, -0.13053131103515625, -0.088958740234375, -0.04738616943359375, -0.0058135986328125, 0.03575897216796875, 0.07733154296875, 0.11890411376953125, 0.1604766845703125, 0.20204925537109375, 0.243621826171875, 0.28519439697265625, 0.3267669677734375, 0.36833953857421875, 0.409912109375, 0.45148468017578125, 0.4930572509765625, 0.5346298217773438, 0.576202392578125, 0.6177749633789062, 0.6593475341796875, 0.7009201049804688, 0.74249267578125, 0.7840652465820312, 0.8256378173828125, 0.8672103881835938, 0.908782958984375, 0.9503555297851562, 0.9919281005859375, 1.0335006713867188, 1.0750732421875, 1.1166458129882812, 1.1582183837890625, 1.1997909545898438, 1.241363525390625, 1.2829360961914062, 1.3245086669921875, 1.3660812377929688, 1.40765380859375, 1.4492263793945312, 1.4907989501953125, 1.5323715209960938, 1.573944091796875, 1.6155166625976562, 1.6570892333984375, 1.6986618041992188, 1.740234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 22.0, 31.0, 70.0, 106.0, 165.0, 183.0, 148.0, 113.0, 62.0, 31.0, 12.0, 15.0, 7.0, 9.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9807820320129395, -6.546756267547607, -6.112730503082275, -5.678705215454102, -5.2446794509887695, -4.8106536865234375, -4.3766279220581055, -3.9426021575927734, -3.5085763931274414, -3.0745506286621094, -2.6405248641967773, -2.2064993381500244, -1.7724735736846924, -1.3384478092193604, -0.9044222831726074, -0.4703965187072754, -0.03637075424194336, 0.3976549506187439, 0.8316806554794312, 1.2657063007354736, 1.6997320652008057, 2.1337578296661377, 2.5677833557128906, 3.0018091201782227, 3.4358348846435547, 3.8698606491088867, 4.303886413574219, 4.737912178039551, 5.171937942504883, 5.605963706970215, 6.039988994598389, 6.474014759063721, 6.908041000366211, 7.342066764831543, 7.776092529296875, 8.210118293762207, 8.644144058227539, 9.078169822692871, 9.512195587158203, 9.946220397949219, 10.380247116088867, 10.8142728805542, 11.248298645019531, 11.682324409484863, 12.116350173950195, 12.550375938415527, 12.98440170288086, 13.418426513671875, 13.852452278137207, 14.286478042602539, 14.720503807067871, 15.154529571533203, 15.588555335998535, 16.022581100463867, 16.456605911254883, 16.89063262939453, 17.324657440185547, 17.758682250976562, 18.19270896911621, 18.626733779907227, 19.060760498046875, 19.49478530883789, 19.92881202697754, 20.362836837768555, 20.796863555908203]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 16.0, 15.0, 16.0, 24.0, 33.0, 46.0, 39.0, 35.0, 35.0, 35.0, 33.0, 47.0, 44.0, 39.0, 47.0, 50.0, 55.0, 46.0, 33.0, 31.0, 29.0, 37.0, 31.0, 36.0, 32.0, 24.0, 13.0, 17.0, 7.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.798887252807617, -6.553752422332764, -6.308617115020752, -6.063482284545898, -5.818346977233887, -5.573212146759033, -5.32807731628418, -5.082942008972168, -4.8378071784973145, -4.592672348022461, -4.347537040710449, -4.102402210235596, -3.857267141342163, -3.6121320724487305, -3.366997241973877, -3.1218621730804443, -2.8767271041870117, -2.631592035293579, -2.3864569664001465, -2.141322135925293, -1.8961870670318604, -1.6510519981384277, -1.4059170484542847, -1.1607820987701416, -0.915647029876709, -0.6705120205879211, -0.4253770112991333, -0.18024200201034546, 0.06489300727844238, 0.310028076171875, 0.5551630258560181, 0.8002979755401611, 1.0454330444335938, 1.2905681133270264, 1.5357030630111694, 1.7808380126953125, 2.025973081588745, 2.2711081504821777, 2.5162429809570312, 2.761378049850464, 3.0065131187438965, 3.251648187637329, 3.4967832565307617, 3.7419180870056152, 3.987053155899048, 4.2321882247924805, 4.477323055267334, 4.7224578857421875, 4.967593193054199, 5.212728023529053, 5.4578633308410645, 5.702998161315918, 5.94813346862793, 6.193268299102783, 6.438403129577637, 6.683538436889648, 6.928673267364502, 7.1738080978393555, 7.418943405151367, 7.664078235626221, 7.909213066101074, 8.154348373413086, 8.399483680725098, 8.644618034362793, 8.889753341674805]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 9.0, 16.0, 27.0, 42.0, 77.0, 106.0, 182.0, 267.0, 471.0, 800.0, 1531.0, 2796.0, 5459.0, 10795.0, 23141.0, 52855.0, 131360.0, 304760.0, 294359.0, 125284.0, 50382.0, 21973.0, 10445.0, 5163.0, 2746.0, 1502.0, 803.0, 448.0, 280.0, 176.0, 97.0, 56.0, 53.0, 30.0, 15.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.154296875, -1.1144561767578125, -1.074615478515625, -1.0347747802734375, -0.99493408203125, -0.9550933837890625, -0.915252685546875, -0.8754119873046875, -0.8355712890625, -0.7957305908203125, -0.755889892578125, -0.7160491943359375, -0.67620849609375, -0.6363677978515625, -0.596527099609375, -0.5566864013671875, -0.516845703125, -0.4770050048828125, -0.437164306640625, -0.3973236083984375, -0.35748291015625, -0.3176422119140625, -0.277801513671875, -0.2379608154296875, -0.1981201171875, -0.1582794189453125, -0.118438720703125, -0.0785980224609375, -0.03875732421875, 0.0010833740234375, 0.040924072265625, 0.0807647705078125, 0.12060546875, 0.1604461669921875, 0.200286865234375, 0.2401275634765625, 0.27996826171875, 0.3198089599609375, 0.359649658203125, 0.3994903564453125, 0.4393310546875, 0.4791717529296875, 0.519012451171875, 0.5588531494140625, 0.59869384765625, 0.6385345458984375, 0.678375244140625, 0.7182159423828125, 0.758056640625, 0.7978973388671875, 0.837738037109375, 0.8775787353515625, 0.91741943359375, 0.9572601318359375, 0.997100830078125, 1.0369415283203125, 1.0767822265625, 1.1166229248046875, 1.156463623046875, 1.1963043212890625, 1.23614501953125, 1.2759857177734375, 1.315826416015625, 1.3556671142578125, 1.3955078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 22.0, 29.0, 20.0, 35.0, 37.0, 59.0, 57.0, 40.0, 60.0, 56.0, 56.0, 67.0, 52.0, 50.0, 55.0, 42.0, 35.0, 42.0, 32.0, 27.0, 20.0, 16.0, 10.0, 9.0, 10.0, 9.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9017791748046875, -0.868011474609375, -0.8342437744140625, -0.80047607421875, -0.7667083740234375, -0.732940673828125, -0.6991729736328125, -0.6654052734375, -0.6316375732421875, -0.597869873046875, -0.5641021728515625, -0.53033447265625, -0.4965667724609375, -0.462799072265625, -0.4290313720703125, -0.395263671875, -0.3614959716796875, -0.327728271484375, -0.2939605712890625, -0.26019287109375, -0.2264251708984375, -0.192657470703125, -0.1588897705078125, -0.1251220703125, -0.0913543701171875, -0.057586669921875, -0.0238189697265625, 0.00994873046875, 0.0437164306640625, 0.077484130859375, 0.1112518310546875, 0.14501953125, 0.1787872314453125, 0.212554931640625, 0.2463226318359375, 0.28009033203125, 0.3138580322265625, 0.347625732421875, 0.3813934326171875, 0.4151611328125, 0.4489288330078125, 0.482696533203125, 0.5164642333984375, 0.55023193359375, 0.5839996337890625, 0.617767333984375, 0.6515350341796875, 0.685302734375, 0.7190704345703125, 0.752838134765625, 0.7866058349609375, 0.82037353515625, 0.8541412353515625, 0.887908935546875, 0.9216766357421875, 0.9554443359375, 0.9892120361328125, 1.022979736328125, 1.0567474365234375, 1.09051513671875, 1.1242828369140625, 1.158050537109375, 1.1918182373046875, 1.2255859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 12.0, 8.0, 14.0, 15.0, 17.0, 27.0, 34.0, 51.0, 74.0, 78.0, 106.0, 132.0, 212.0, 298.0, 418.0, 629.0, 968.0, 1907.0, 4633.0, 18695.0, 123896.0, 756737.0, 113111.0, 17126.0, 4498.0, 1830.0, 957.0, 649.0, 377.0, 285.0, 199.0, 134.0, 99.0, 79.0, 66.0, 52.0, 32.0, 36.0, 17.0, 15.0, 7.0, 5.0, 11.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.165283203125, -2.09423828125, -2.023193359375, -1.9521484375, -1.881103515625, -1.81005859375, -1.739013671875, -1.66796875, -1.596923828125, -1.52587890625, -1.454833984375, -1.3837890625, -1.312744140625, -1.24169921875, -1.170654296875, -1.099609375, -1.028564453125, -0.95751953125, -0.886474609375, -0.8154296875, -0.744384765625, -0.67333984375, -0.602294921875, -0.53125, -0.460205078125, -0.38916015625, -0.318115234375, -0.2470703125, -0.176025390625, -0.10498046875, -0.033935546875, 0.037109375, 0.108154296875, 0.17919921875, 0.250244140625, 0.3212890625, 0.392333984375, 0.46337890625, 0.534423828125, 0.60546875, 0.676513671875, 0.74755859375, 0.818603515625, 0.8896484375, 0.960693359375, 1.03173828125, 1.102783203125, 1.173828125, 1.244873046875, 1.31591796875, 1.386962890625, 1.4580078125, 1.529052734375, 1.60009765625, 1.671142578125, 1.7421875, 1.813232421875, 1.88427734375, 1.955322265625, 2.0263671875, 2.097412109375, 2.16845703125, 2.239501953125, 2.310546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 10.0, 10.0, 13.0, 12.0, 13.0, 14.0, 24.0, 26.0, 32.0, 32.0, 32.0, 46.0, 43.0, 44.0, 56.0, 45.0, 63.0, 62.0, 53.0, 51.0, 53.0, 41.0, 33.0, 21.0, 30.0, 27.0, 20.0, 17.0, 10.0, 11.0, 16.0, 7.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1796875, -3.078155517578125, -2.97662353515625, -2.875091552734375, -2.7735595703125, -2.672027587890625, -2.57049560546875, -2.468963623046875, -2.367431640625, -2.265899658203125, -2.16436767578125, -2.062835693359375, -1.9613037109375, -1.859771728515625, -1.75823974609375, -1.656707763671875, -1.55517578125, -1.453643798828125, -1.35211181640625, -1.250579833984375, -1.1490478515625, -1.047515869140625, -0.94598388671875, -0.844451904296875, -0.742919921875, -0.641387939453125, -0.53985595703125, -0.438323974609375, -0.3367919921875, -0.235260009765625, -0.13372802734375, -0.032196044921875, 0.0693359375, 0.170867919921875, 0.27239990234375, 0.373931884765625, 0.4754638671875, 0.576995849609375, 0.67852783203125, 0.780059814453125, 0.881591796875, 0.983123779296875, 1.08465576171875, 1.186187744140625, 1.2877197265625, 1.389251708984375, 1.49078369140625, 1.592315673828125, 1.69384765625, 1.795379638671875, 1.89691162109375, 1.998443603515625, 2.0999755859375, 2.201507568359375, 2.30303955078125, 2.404571533203125, 2.506103515625, 2.607635498046875, 2.70916748046875, 2.810699462890625, 2.9122314453125, 3.013763427734375, 3.11529541015625, 3.216827392578125, 3.318359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 8.0, 21.0, 43.0, 30.0, 64.0, 109.0, 147.0, 286.0, 522.0, 1136.0, 2931.0, 9559.0, 45292.0, 308668.0, 610829.0, 52413.0, 10858.0, 3146.0, 1145.0, 560.0, 302.0, 163.0, 95.0, 61.0, 50.0, 28.0, 22.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.492431640625, -0.4754753112792969, -0.45851898193359375, -0.4415626525878906, -0.4246063232421875, -0.4076499938964844, -0.39069366455078125, -0.3737373352050781, -0.356781005859375, -0.3398246765136719, -0.32286834716796875, -0.3059120178222656, -0.2889556884765625, -0.2719993591308594, -0.25504302978515625, -0.23808670043945312, -0.22113037109375, -0.20417404174804688, -0.18721771240234375, -0.17026138305664062, -0.1533050537109375, -0.13634872436523438, -0.11939239501953125, -0.10243606567382812, -0.085479736328125, -0.06852340698242188, -0.05156707763671875, -0.034610748291015625, -0.0176544189453125, -0.000698089599609375, 0.01625823974609375, 0.033214569091796875, 0.0501708984375, 0.06712722778320312, 0.08408355712890625, 0.10103988647460938, 0.1179962158203125, 0.13495254516601562, 0.15190887451171875, 0.16886520385742188, 0.185821533203125, 0.20277786254882812, 0.21973419189453125, 0.23669052124023438, 0.2536468505859375, 0.2706031799316406, 0.28755950927734375, 0.3045158386230469, 0.32147216796875, 0.3384284973144531, 0.35538482666015625, 0.3723411560058594, 0.3892974853515625, 0.4062538146972656, 0.42321014404296875, 0.4401664733886719, 0.457122802734375, 0.4740791320800781, 0.49103546142578125, 0.5079917907714844, 0.5249481201171875, 0.5419044494628906, 0.5588607788085938, 0.5758171081542969, 0.5927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 7.0, 9.0, 12.0, 11.0, 18.0, 22.0, 24.0, 27.0, 29.0, 44.0, 74.0, 69.0, 77.0, 82.0, 88.0, 82.0, 66.0, 46.0, 38.0, 20.0, 29.0, 18.0, 24.0, 16.0, 9.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001481771469116211, -0.00014331750571727753, -0.00013845786452293396, -0.0001335982233285904, -0.00012873858213424683, -0.00012387894093990326, -0.00011901929974555969, -0.00011415965855121613, -0.00010930001735687256, -0.00010444037616252899, -9.958073496818542e-05, -9.472109377384186e-05, -8.986145257949829e-05, -8.500181138515472e-05, -8.014217019081116e-05, -7.528252899646759e-05, -7.042288780212402e-05, -6.556324660778046e-05, -6.070360541343689e-05, -5.584396421909332e-05, -5.0984323024749756e-05, -4.612468183040619e-05, -4.126504063606262e-05, -3.6405399441719055e-05, -3.154575824737549e-05, -2.668611705303192e-05, -2.1826475858688354e-05, -1.6966834664344788e-05, -1.210719347000122e-05, -7.247552275657654e-06, -2.387911081314087e-06, 2.47173011302948e-06, 7.331371307373047e-06, 1.2191012501716614e-05, 1.705065369606018e-05, 2.1910294890403748e-05, 2.6769936084747314e-05, 3.162957727909088e-05, 3.648921847343445e-05, 4.1348859667778015e-05, 4.620850086212158e-05, 5.106814205646515e-05, 5.5927783250808716e-05, 6.078742444515228e-05, 6.564706563949585e-05, 7.050670683383942e-05, 7.536634802818298e-05, 8.022598922252655e-05, 8.508563041687012e-05, 8.994527161121368e-05, 9.480491280555725e-05, 9.966455399990082e-05, 0.00010452419519424438, 0.00010938383638858795, 0.00011424347758293152, 0.00011910311877727509, 0.00012396275997161865, 0.00012882240116596222, 0.00013368204236030579, 0.00013854168355464935, 0.00014340132474899292, 0.0001482609659433365, 0.00015312060713768005, 0.00015798024833202362, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 5.0, 16.0, 27.0, 26.0, 41.0, 49.0, 110.0, 146.0, 234.0, 382.0, 708.0, 1440.0, 3633.0, 12015.0, 55845.0, 604014.0, 305091.0, 48002.0, 10509.0, 3282.0, 1325.0, 629.0, 394.0, 206.0, 137.0, 83.0, 45.0, 46.0, 24.0, 18.0, 14.0, 12.0, 11.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5430030822753906, -0.5279006958007812, -0.5127983093261719, -0.4976959228515625, -0.4825935363769531, -0.46749114990234375, -0.4523887634277344, -0.437286376953125, -0.4221839904785156, -0.40708160400390625, -0.3919792175292969, -0.3768768310546875, -0.3617744445800781, -0.34667205810546875, -0.3315696716308594, -0.31646728515625, -0.3013648986816406, -0.28626251220703125, -0.2711601257324219, -0.2560577392578125, -0.24095535278320312, -0.22585296630859375, -0.21075057983398438, -0.195648193359375, -0.18054580688476562, -0.16544342041015625, -0.15034103393554688, -0.1352386474609375, -0.12013626098632812, -0.10503387451171875, -0.08993148803710938, -0.0748291015625, -0.059726715087890625, -0.04462432861328125, -0.029521942138671875, -0.0144195556640625, 0.000682830810546875, 0.01578521728515625, 0.030887603759765625, 0.045989990234375, 0.061092376708984375, 0.07619476318359375, 0.09129714965820312, 0.1063995361328125, 0.12150192260742188, 0.13660430908203125, 0.15170669555664062, 0.16680908203125, 0.18191146850585938, 0.19701385498046875, 0.21211624145507812, 0.2272186279296875, 0.24232101440429688, 0.25742340087890625, 0.2725257873535156, 0.287628173828125, 0.3027305603027344, 0.31783294677734375, 0.3329353332519531, 0.3480377197265625, 0.3631401062011719, 0.37824249267578125, 0.3933448791503906, 0.408447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 6.0, 15.0, 18.0, 19.0, 22.0, 25.0, 31.0, 28.0, 53.0, 65.0, 62.0, 88.0, 75.0, 82.0, 62.0, 45.0, 54.0, 44.0, 41.0, 29.0, 17.0, 17.0, 14.0, 13.0, 9.0, 9.0, 11.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.462158203125, -0.44886016845703125, -0.4355621337890625, -0.42226409912109375, -0.408966064453125, -0.39566802978515625, -0.3823699951171875, -0.36907196044921875, -0.35577392578125, -0.34247589111328125, -0.3291778564453125, -0.31587982177734375, -0.302581787109375, -0.28928375244140625, -0.2759857177734375, -0.26268768310546875, -0.2493896484375, -0.23609161376953125, -0.2227935791015625, -0.20949554443359375, -0.196197509765625, -0.18289947509765625, -0.1696014404296875, -0.15630340576171875, -0.14300537109375, -0.12970733642578125, -0.1164093017578125, -0.10311126708984375, -0.089813232421875, -0.07651519775390625, -0.0632171630859375, -0.04991912841796875, -0.03662109375, -0.02332305908203125, -0.0100250244140625, 0.00327301025390625, 0.016571044921875, 0.02986907958984375, 0.0431671142578125, 0.05646514892578125, 0.06976318359375, 0.08306121826171875, 0.0963592529296875, 0.10965728759765625, 0.122955322265625, 0.13625335693359375, 0.1495513916015625, 0.16284942626953125, 0.1761474609375, 0.18944549560546875, 0.2027435302734375, 0.21604156494140625, 0.229339599609375, 0.24263763427734375, 0.2559356689453125, 0.26923370361328125, 0.28253173828125, 0.29582977294921875, 0.3091278076171875, 0.32242584228515625, 0.335723876953125, 0.34902191162109375, 0.3623199462890625, 0.37561798095703125, 0.388916015625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 11.0, 17.0, 23.0, 29.0, 66.0, 96.0, 148.0, 333.0, 131.0, 61.0, 46.0, 16.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.230846405029297, -21.75246238708496, -21.274078369140625, -20.79569435119629, -20.317310333251953, -19.838924407958984, -19.36054039001465, -18.882156372070312, -18.403772354125977, -17.92538833618164, -17.447004318237305, -16.96862030029297, -16.490234375, -16.011850357055664, -15.533466339111328, -15.055082321166992, -14.576698303222656, -14.09831428527832, -13.619930267333984, -13.141545295715332, -12.663161277770996, -12.18477725982666, -11.706392288208008, -11.228008270263672, -10.749624252319336, -10.271240234375, -9.792856216430664, -9.314471244812012, -8.836087226867676, -8.35770320892334, -7.879318714141846, -7.400934219360352, -6.922549247741699, -6.444165229797363, -5.965780735015869, -5.487396240234375, -5.009012222290039, -4.530628204345703, -4.052243709564209, -3.573859453201294, -3.095475196838379, -2.617090940475464, -2.138706684112549, -1.6603224277496338, -1.1819381713867188, -0.7035539150238037, -0.22516965866088867, 0.25321459770202637, 0.7315988540649414, 1.2099831104278564, 1.6883673667907715, 2.1667516231536865, 2.6451358795166016, 3.1235201358795166, 3.6019043922424316, 4.080288887023926, 4.558672904968262, 5.037056922912598, 5.515441417694092, 5.993825912475586, 6.472209930419922, 6.950593948364258, 7.428978443145752, 7.907362937927246, 8.385746955871582]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 12.0, 11.0, 14.0, 15.0, 21.0, 18.0, 21.0, 31.0, 39.0, 38.0, 31.0, 52.0, 145.0, 142.0, 66.0, 45.0, 39.0, 22.0, 31.0, 27.0, 28.0, 21.0, 16.0, 8.0, 9.0, 11.0, 10.0, 13.0, 5.0, 8.0, 5.0, 4.0, 1.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.262158393859863, -12.884936332702637, -12.50771427154541, -12.130491256713867, -11.75326919555664, -11.376047134399414, -10.998825073242188, -10.621603012084961, -10.244380950927734, -9.867158889770508, -9.489936828613281, -9.112714767456055, -8.735491752624512, -8.358269691467285, -7.981047630310059, -7.603825569152832, -7.226602554321289, -6.8493804931640625, -6.472157955169678, -6.094935894012451, -5.717713356018066, -5.34049129486084, -4.963269233703613, -4.586047172546387, -4.208824634552002, -3.8316023349761963, -3.4543800354003906, -3.077157974243164, -2.6999356746673584, -2.3227133750915527, -1.9454913139343262, -1.5682690143585205, -1.1910476684570312, -0.8138254284858704, -0.4366031885147095, -0.05938100814819336, 0.3178412914276123, 0.695063591003418, 1.0722856521606445, 1.4495079517364502, 1.8267302513122559, 2.2039525508880615, 2.581174850463867, 2.9583969116210938, 3.3356192111968994, 3.712841510772705, 4.090063571929932, 4.467286109924316, 4.844508171081543, 5.2217302322387695, 5.598952770233154, 5.976174831390381, 6.353397369384766, 6.730619430541992, 7.107841491699219, 7.485063552856445, 7.86228609085083, 8.239508628845215, 8.616730690002441, 8.993952751159668, 9.371174812316895, 9.748397827148438, 10.125619888305664, 10.50284194946289, 10.880064010620117]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 11.0, 12.0, 11.0, 25.0, 38.0, 77.0, 108.0, 182.0, 287.0, 615.0, 1106.0, 2196.0, 5468.0, 18216.0, 92787.0, 529604.0, 1851096.0, 1328823.0, 291840.0, 51548.0, 12515.0, 3966.0, 1652.0, 957.0, 455.0, 285.0, 170.0, 86.0, 54.0, 34.0, 27.0, 7.0, 10.0, 9.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.83453369140625, -0.7979736328125, -0.76141357421875, -0.724853515625, -0.68829345703125, -0.6517333984375, -0.61517333984375, -0.57861328125, -0.54205322265625, -0.5054931640625, -0.46893310546875, -0.432373046875, -0.39581298828125, -0.3592529296875, -0.32269287109375, -0.2861328125, -0.24957275390625, -0.2130126953125, -0.17645263671875, -0.139892578125, -0.10333251953125, -0.0667724609375, -0.03021240234375, 0.00634765625, 0.04290771484375, 0.0794677734375, 0.11602783203125, 0.152587890625, 0.18914794921875, 0.2257080078125, 0.26226806640625, 0.298828125, 0.33538818359375, 0.3719482421875, 0.40850830078125, 0.445068359375, 0.48162841796875, 0.5181884765625, 0.55474853515625, 0.59130859375, 0.62786865234375, 0.6644287109375, 0.70098876953125, 0.737548828125, 0.77410888671875, 0.8106689453125, 0.84722900390625, 0.8837890625, 0.92034912109375, 0.9569091796875, 0.99346923828125, 1.030029296875, 1.06658935546875, 1.1031494140625, 1.13970947265625, 1.17626953125, 1.21282958984375, 1.2493896484375, 1.28594970703125, 1.322509765625, 1.35906982421875, 1.3956298828125, 1.43218994140625, 1.46875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 13.0, 12.0, 27.0, 22.0, 26.0, 25.0, 26.0, 38.0, 36.0, 55.0, 39.0, 43.0, 40.0, 50.0, 75.0, 57.0, 48.0, 54.0, 41.0, 29.0, 44.0, 41.0, 29.0, 23.0, 19.0, 13.0, 9.0, 15.0, 7.0, 4.0, 10.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9443359375, -0.9166183471679688, -0.8889007568359375, -0.8611831665039062, -0.833465576171875, -0.8057479858398438, -0.7780303955078125, -0.7503128051757812, -0.72259521484375, -0.6948776245117188, -0.6671600341796875, -0.6394424438476562, -0.611724853515625, -0.5840072631835938, -0.5562896728515625, -0.5285720825195312, -0.5008544921875, -0.47313690185546875, -0.4454193115234375, -0.41770172119140625, -0.389984130859375, -0.36226654052734375, -0.3345489501953125, -0.30683135986328125, -0.27911376953125, -0.25139617919921875, -0.2236785888671875, -0.19596099853515625, -0.168243408203125, -0.14052581787109375, -0.1128082275390625, -0.08509063720703125, -0.057373046875, -0.02965545654296875, -0.0019378662109375, 0.02577972412109375, 0.053497314453125, 0.08121490478515625, 0.1089324951171875, 0.13665008544921875, 0.16436767578125, 0.19208526611328125, 0.2198028564453125, 0.24752044677734375, 0.275238037109375, 0.30295562744140625, 0.3306732177734375, 0.35839080810546875, 0.3861083984375, 0.41382598876953125, 0.4415435791015625, 0.46926116943359375, 0.496978759765625, 0.5246963500976562, 0.5524139404296875, 0.5801315307617188, 0.60784912109375, 0.6355667114257812, 0.6632843017578125, 0.6910018920898438, 0.718719482421875, 0.7464370727539062, 0.7741546630859375, 0.8018722534179688, 0.82958984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 6.0, 9.0, 14.0, 18.0, 22.0, 38.0, 48.0, 76.0, 130.0, 200.0, 394.0, 743.0, 1641.0, 4814.0, 33327.0, 3487256.0, 643389.0, 15830.0, 3496.0, 1349.0, 605.0, 347.0, 187.0, 108.0, 73.0, 52.0, 24.0, 15.0, 24.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.87628173828125, -3.7545166015625, -3.63275146484375, -3.510986328125, -3.38922119140625, -3.2674560546875, -3.14569091796875, -3.02392578125, -2.90216064453125, -2.7803955078125, -2.65863037109375, -2.536865234375, -2.41510009765625, -2.2933349609375, -2.17156982421875, -2.0498046875, -1.92803955078125, -1.8062744140625, -1.68450927734375, -1.562744140625, -1.44097900390625, -1.3192138671875, -1.19744873046875, -1.07568359375, -0.95391845703125, -0.8321533203125, -0.71038818359375, -0.588623046875, -0.46685791015625, -0.3450927734375, -0.22332763671875, -0.1015625, 0.02020263671875, 0.1419677734375, 0.26373291015625, 0.385498046875, 0.50726318359375, 0.6290283203125, 0.75079345703125, 0.87255859375, 0.99432373046875, 1.1160888671875, 1.23785400390625, 1.359619140625, 1.48138427734375, 1.6031494140625, 1.72491455078125, 1.8466796875, 1.96844482421875, 2.0902099609375, 2.21197509765625, 2.333740234375, 2.45550537109375, 2.5772705078125, 2.69903564453125, 2.82080078125, 2.94256591796875, 3.0643310546875, 3.18609619140625, 3.307861328125, 3.42962646484375, 3.5513916015625, 3.67315673828125, 3.794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 5.0, 16.0, 14.0, 21.0, 36.0, 46.0, 73.0, 108.0, 146.0, 208.0, 328.0, 430.0, 545.0, 509.0, 400.0, 319.0, 225.0, 166.0, 124.0, 92.0, 55.0, 50.0, 29.0, 24.0, 25.0, 15.0, 14.0, 3.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.03125, -1.958160400390625, -1.88507080078125, -1.811981201171875, -1.7388916015625, -1.665802001953125, -1.59271240234375, -1.519622802734375, -1.446533203125, -1.373443603515625, -1.30035400390625, -1.227264404296875, -1.1541748046875, -1.081085205078125, -1.00799560546875, -0.934906005859375, -0.86181640625, -0.788726806640625, -0.71563720703125, -0.642547607421875, -0.5694580078125, -0.496368408203125, -0.42327880859375, -0.350189208984375, -0.277099609375, -0.204010009765625, -0.13092041015625, -0.057830810546875, 0.0152587890625, 0.088348388671875, 0.16143798828125, 0.234527587890625, 0.3076171875, 0.380706787109375, 0.45379638671875, 0.526885986328125, 0.5999755859375, 0.673065185546875, 0.74615478515625, 0.819244384765625, 0.892333984375, 0.965423583984375, 1.03851318359375, 1.111602783203125, 1.1846923828125, 1.257781982421875, 1.33087158203125, 1.403961181640625, 1.47705078125, 1.550140380859375, 1.62322998046875, 1.696319580078125, 1.7694091796875, 1.842498779296875, 1.91558837890625, 1.988677978515625, 2.061767578125, 2.134857177734375, 2.20794677734375, 2.281036376953125, 2.3541259765625, 2.427215576171875, 2.50030517578125, 2.573394775390625, 2.646484375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 2.0, 8.0, 7.0, 22.0, 36.0, 66.0, 119.0, 232.0, 222.0, 147.0, 55.0, 34.0, 19.0, 12.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.069202423095703, -25.97530174255371, -24.88140106201172, -23.787500381469727, -22.693599700927734, -21.59969711303711, -20.505796432495117, -19.411895751953125, -18.317995071411133, -17.22409439086914, -16.13019371032715, -15.03629207611084, -13.942391395568848, -12.848490715026855, -11.754589080810547, -10.660688400268555, -9.566787719726562, -8.47288703918457, -7.37898588180542, -6.2850847244262695, -5.191184043884277, -4.097283363342285, -3.0033822059631348, -1.9094810485839844, -0.8155803680419922, 0.2783205509185791, 1.3722214698791504, 2.4661223888397217, 3.560023307800293, 4.653923988342285, 5.7478251457214355, 6.841726303100586, 7.935626983642578, 9.02952766418457, 10.123428344726562, 11.217329978942871, 12.311230659484863, 13.405131340026855, 14.499032974243164, 15.592933654785156, 16.68683433532715, 17.78073501586914, 18.874635696411133, 19.968536376953125, 21.06243896484375, 22.15633773803711, 23.250240325927734, 24.344141006469727, 25.43804168701172, 26.53194236755371, 27.625843048095703, 28.719743728637695, 29.813644409179688, 30.907546997070312, 32.00144577026367, 33.0953483581543, 34.189247131347656, 35.28314971923828, 36.37704849243164, 37.470951080322266, 38.564849853515625, 39.65875244140625, 40.75265121459961, 41.846553802490234, 42.94045639038086]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 4.0, 6.0, 12.0, 7.0, 17.0, 17.0, 8.0, 18.0, 25.0, 15.0, 24.0, 21.0, 36.0, 32.0, 40.0, 36.0, 45.0, 42.0, 54.0, 58.0, 61.0, 53.0, 49.0, 39.0, 35.0, 27.0, 23.0, 36.0, 24.0, 29.0, 15.0, 13.0, 18.0, 12.0, 17.0, 4.0, 7.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.017311096191406, -14.561007499694824, -14.104703903198242, -13.648401260375977, -13.192097663879395, -12.735794067382812, -12.27949047088623, -11.823186874389648, -11.366883277893066, -10.910579681396484, -10.454276084899902, -9.99797248840332, -9.541669845581055, -9.085366249084473, -8.62906265258789, -8.172759056091309, -7.716455936431885, -7.260152339935303, -6.803849220275879, -6.347545623779297, -5.891242027282715, -5.434938430786133, -4.978635311126709, -4.522331714630127, -4.066028594970703, -3.6097252368927, -3.153421640396118, -2.6971182823181152, -2.240814685821533, -1.7845113277435303, -1.3282079696655273, -0.8719043731689453, -0.4156007766723633, 0.04070267081260681, 0.4970061182975769, 0.9533095359802246, 1.409613013267517, 1.8659164905548096, 2.3222198486328125, 2.7785234451293945, 3.2348268032073975, 3.6911301612854004, 4.147433757781982, 4.603736877441406, 5.060040473937988, 5.51634407043457, 5.972647666931152, 6.428951263427734, 6.885254383087158, 7.34155797958374, 7.797861099243164, 8.254164695739746, 8.710468292236328, 9.16677188873291, 9.623075485229492, 10.079378128051758, 10.53568172454834, 10.991985321044922, 11.448288917541504, 11.904592514038086, 12.360895156860352, 12.817198753356934, 13.273502349853516, 13.729805946350098, 14.18610954284668]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 11.0, 16.0, 11.0, 36.0, 49.0, 68.0, 110.0, 177.0, 266.0, 442.0, 849.0, 1585.0, 3361.0, 7566.0, 20300.0, 65552.0, 288216.0, 511094.0, 100767.0, 28941.0, 10323.0, 4307.0, 1975.0, 1088.0, 530.0, 327.0, 195.0, 124.0, 78.0, 40.0, 35.0, 19.0, 22.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5224609375, -1.47198486328125, -1.4215087890625, -1.37103271484375, -1.320556640625, -1.27008056640625, -1.2196044921875, -1.16912841796875, -1.11865234375, -1.06817626953125, -1.0177001953125, -0.96722412109375, -0.916748046875, -0.86627197265625, -0.8157958984375, -0.76531982421875, -0.71484375, -0.66436767578125, -0.6138916015625, -0.56341552734375, -0.512939453125, -0.46246337890625, -0.4119873046875, -0.36151123046875, -0.31103515625, -0.26055908203125, -0.2100830078125, -0.15960693359375, -0.109130859375, -0.05865478515625, -0.0081787109375, 0.04229736328125, 0.0927734375, 0.14324951171875, 0.1937255859375, 0.24420166015625, 0.294677734375, 0.34515380859375, 0.3956298828125, 0.44610595703125, 0.49658203125, 0.54705810546875, 0.5975341796875, 0.64801025390625, 0.698486328125, 0.74896240234375, 0.7994384765625, 0.84991455078125, 0.900390625, 0.95086669921875, 1.0013427734375, 1.05181884765625, 1.102294921875, 1.15277099609375, 1.2032470703125, 1.25372314453125, 1.30419921875, 1.35467529296875, 1.4051513671875, 1.45562744140625, 1.506103515625, 1.55657958984375, 1.6070556640625, 1.65753173828125, 1.7080078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 17.0, 11.0, 33.0, 32.0, 36.0, 41.0, 47.0, 52.0, 65.0, 56.0, 71.0, 74.0, 70.0, 64.0, 74.0, 49.0, 36.0, 37.0, 17.0, 27.0, 16.0, 9.0, 13.0, 7.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2172393798828125, -1.173736572265625, -1.1302337646484375, -1.08673095703125, -1.0432281494140625, -0.999725341796875, -0.9562225341796875, -0.9127197265625, -0.8692169189453125, -0.825714111328125, -0.7822113037109375, -0.73870849609375, -0.6952056884765625, -0.651702880859375, -0.6082000732421875, -0.564697265625, -0.5211944580078125, -0.477691650390625, -0.4341888427734375, -0.39068603515625, -0.3471832275390625, -0.303680419921875, -0.2601776123046875, -0.2166748046875, -0.1731719970703125, -0.129669189453125, -0.0861663818359375, -0.04266357421875, 0.0008392333984375, 0.044342041015625, 0.0878448486328125, 0.13134765625, 0.1748504638671875, 0.218353271484375, 0.2618560791015625, 0.30535888671875, 0.3488616943359375, 0.392364501953125, 0.4358673095703125, 0.4793701171875, 0.5228729248046875, 0.566375732421875, 0.6098785400390625, 0.65338134765625, 0.6968841552734375, 0.740386962890625, 0.7838897705078125, 0.827392578125, 0.8708953857421875, 0.914398193359375, 0.9579010009765625, 1.00140380859375, 1.0449066162109375, 1.088409423828125, 1.1319122314453125, 1.1754150390625, 1.2189178466796875, 1.262420654296875, 1.3059234619140625, 1.34942626953125, 1.3929290771484375, 1.436431884765625, 1.4799346923828125, 1.5234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 16.0, 25.0, 22.0, 37.0, 48.0, 68.0, 118.0, 199.0, 320.0, 615.0, 1335.0, 4374.0, 30102.0, 887942.0, 110053.0, 9457.0, 2136.0, 745.0, 414.0, 231.0, 91.0, 73.0, 35.0, 28.0, 22.0, 16.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.383514404296875, -2.29437255859375, -2.205230712890625, -2.1160888671875, -2.026947021484375, -1.93780517578125, -1.848663330078125, -1.759521484375, -1.670379638671875, -1.58123779296875, -1.492095947265625, -1.4029541015625, -1.313812255859375, -1.22467041015625, -1.135528564453125, -1.04638671875, -0.957244873046875, -0.86810302734375, -0.778961181640625, -0.6898193359375, -0.600677490234375, -0.51153564453125, -0.422393798828125, -0.333251953125, -0.244110107421875, -0.15496826171875, -0.065826416015625, 0.0233154296875, 0.112457275390625, 0.20159912109375, 0.290740966796875, 0.3798828125, 0.469024658203125, 0.55816650390625, 0.647308349609375, 0.7364501953125, 0.825592041015625, 0.91473388671875, 1.003875732421875, 1.093017578125, 1.182159423828125, 1.27130126953125, 1.360443115234375, 1.4495849609375, 1.538726806640625, 1.62786865234375, 1.717010498046875, 1.80615234375, 1.895294189453125, 1.98443603515625, 2.073577880859375, 2.1627197265625, 2.251861572265625, 2.34100341796875, 2.430145263671875, 2.519287109375, 2.608428955078125, 2.69757080078125, 2.786712646484375, 2.8758544921875, 2.964996337890625, 3.05413818359375, 3.143280029296875, 3.232421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 6.0, 3.0, 10.0, 5.0, 13.0, 14.0, 21.0, 22.0, 16.0, 19.0, 27.0, 21.0, 34.0, 40.0, 44.0, 40.0, 65.0, 89.0, 69.0, 73.0, 73.0, 51.0, 49.0, 33.0, 25.0, 23.0, 22.0, 18.0, 22.0, 12.0, 9.0, 4.0, 9.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37890625, -4.252410888671875, -4.12591552734375, -3.999420166015625, -3.8729248046875, -3.746429443359375, -3.61993408203125, -3.493438720703125, -3.366943359375, -3.240447998046875, -3.11395263671875, -2.987457275390625, -2.8609619140625, -2.734466552734375, -2.60797119140625, -2.481475830078125, -2.35498046875, -2.228485107421875, -2.10198974609375, -1.975494384765625, -1.8489990234375, -1.722503662109375, -1.59600830078125, -1.469512939453125, -1.343017578125, -1.216522216796875, -1.09002685546875, -0.963531494140625, -0.8370361328125, -0.710540771484375, -0.58404541015625, -0.457550048828125, -0.3310546875, -0.204559326171875, -0.07806396484375, 0.048431396484375, 0.1749267578125, 0.301422119140625, 0.42791748046875, 0.554412841796875, 0.680908203125, 0.807403564453125, 0.93389892578125, 1.060394287109375, 1.1868896484375, 1.313385009765625, 1.43988037109375, 1.566375732421875, 1.69287109375, 1.819366455078125, 1.94586181640625, 2.072357177734375, 2.1988525390625, 2.325347900390625, 2.45184326171875, 2.578338623046875, 2.704833984375, 2.831329345703125, 2.95782470703125, 3.084320068359375, 3.2108154296875, 3.337310791015625, 3.46380615234375, 3.590301513671875, 3.716796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 6.0, 8.0, 15.0, 19.0, 29.0, 38.0, 71.0, 140.0, 292.0, 562.0, 1562.0, 5998.0, 37034.0, 911672.0, 77768.0, 9427.0, 2391.0, 736.0, 328.0, 168.0, 91.0, 62.0, 39.0, 13.0, 10.0, 7.0, 13.0, 7.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.67333984375, -0.6533279418945312, -0.6333160400390625, -0.6133041381835938, -0.593292236328125, -0.5732803344726562, -0.5532684326171875, -0.5332565307617188, -0.51324462890625, -0.49323272705078125, -0.4732208251953125, -0.45320892333984375, -0.433197021484375, -0.41318511962890625, -0.3931732177734375, -0.37316131591796875, -0.3531494140625, -0.33313751220703125, -0.3131256103515625, -0.29311370849609375, -0.273101806640625, -0.25308990478515625, -0.2330780029296875, -0.21306610107421875, -0.19305419921875, -0.17304229736328125, -0.1530303955078125, -0.13301849365234375, -0.113006591796875, -0.09299468994140625, -0.0729827880859375, -0.05297088623046875, -0.032958984375, -0.01294708251953125, 0.0070648193359375, 0.02707672119140625, 0.047088623046875, 0.06710052490234375, 0.0871124267578125, 0.10712432861328125, 0.12713623046875, 0.14714813232421875, 0.1671600341796875, 0.18717193603515625, 0.207183837890625, 0.22719573974609375, 0.2472076416015625, 0.26721954345703125, 0.2872314453125, 0.30724334716796875, 0.3272552490234375, 0.34726715087890625, 0.367279052734375, 0.38729095458984375, 0.4073028564453125, 0.42731475830078125, 0.44732666015625, 0.46733856201171875, 0.4873504638671875, 0.5073623657226562, 0.527374267578125, 0.5473861694335938, 0.5673980712890625, 0.5874099731445312, 0.607421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 5.0, 11.0, 13.0, 7.0, 14.0, 12.0, 20.0, 31.0, 28.0, 53.0, 87.0, 88.0, 100.0, 101.0, 103.0, 70.0, 39.0, 37.0, 23.0, 22.0, 20.0, 19.0, 8.0, 11.0, 8.0, 7.0, 6.0, 4.0, 10.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00012183189392089844, -0.00011773966252803802, -0.00011364743113517761, -0.0001095551997423172, -0.00010546296834945679, -0.00010137073695659637, -9.727850556373596e-05, -9.318627417087555e-05, -8.909404277801514e-05, -8.500181138515472e-05, -8.090957999229431e-05, -7.68173485994339e-05, -7.272511720657349e-05, -6.863288581371307e-05, -6.454065442085266e-05, -6.044842302799225e-05, -5.6356191635131836e-05, -5.226396024227142e-05, -4.817172884941101e-05, -4.40794974565506e-05, -3.9987266063690186e-05, -3.589503467082977e-05, -3.180280327796936e-05, -2.7710571885108948e-05, -2.3618340492248535e-05, -1.9526109099388123e-05, -1.543387770652771e-05, -1.1341646313667297e-05, -7.249414920806885e-06, -3.157183527946472e-06, 9.350478649139404e-07, 5.027279257774353e-06, 9.119510650634766e-06, 1.3211742043495178e-05, 1.730397343635559e-05, 2.1396204829216003e-05, 2.5488436222076416e-05, 2.958066761493683e-05, 3.367289900779724e-05, 3.7765130400657654e-05, 4.1857361793518066e-05, 4.594959318637848e-05, 5.004182457923889e-05, 5.4134055972099304e-05, 5.822628736495972e-05, 6.231851875782013e-05, 6.641075015068054e-05, 7.050298154354095e-05, 7.459521293640137e-05, 7.868744432926178e-05, 8.277967572212219e-05, 8.68719071149826e-05, 9.096413850784302e-05, 9.505636990070343e-05, 9.914860129356384e-05, 0.00010324083268642426, 0.00010733306407928467, 0.00011142529547214508, 0.00011551752686500549, 0.0001196097582578659, 0.00012370198965072632, 0.00012779422104358673, 0.00013188645243644714, 0.00013597868382930756, 0.00014007091522216797]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 16.0, 14.0, 33.0, 46.0, 80.0, 150.0, 264.0, 533.0, 1228.0, 3337.0, 12206.0, 72257.0, 874306.0, 66706.0, 11647.0, 3323.0, 1288.0, 488.0, 245.0, 146.0, 99.0, 48.0, 23.0, 9.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397216796875, -0.384185791015625, -0.37115478515625, -0.358123779296875, -0.3450927734375, -0.332061767578125, -0.31903076171875, -0.305999755859375, -0.29296875, -0.279937744140625, -0.26690673828125, -0.253875732421875, -0.2408447265625, -0.227813720703125, -0.21478271484375, -0.201751708984375, -0.188720703125, -0.175689697265625, -0.16265869140625, -0.149627685546875, -0.1365966796875, -0.123565673828125, -0.11053466796875, -0.097503662109375, -0.08447265625, -0.071441650390625, -0.05841064453125, -0.045379638671875, -0.0323486328125, -0.019317626953125, -0.00628662109375, 0.006744384765625, 0.019775390625, 0.032806396484375, 0.04583740234375, 0.058868408203125, 0.0718994140625, 0.084930419921875, 0.09796142578125, 0.110992431640625, 0.1240234375, 0.137054443359375, 0.15008544921875, 0.163116455078125, 0.1761474609375, 0.189178466796875, 0.20220947265625, 0.215240478515625, 0.228271484375, 0.241302490234375, 0.25433349609375, 0.267364501953125, 0.2803955078125, 0.293426513671875, 0.30645751953125, 0.319488525390625, 0.33251953125, 0.345550537109375, 0.35858154296875, 0.371612548828125, 0.3846435546875, 0.397674560546875, 0.41070556640625, 0.423736572265625, 0.436767578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 14.0, 15.0, 20.0, 20.0, 37.0, 38.0, 59.0, 62.0, 74.0, 114.0, 107.0, 85.0, 72.0, 62.0, 38.0, 34.0, 23.0, 19.0, 15.0, 13.0, 12.0, 5.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.36083984375, -0.3484230041503906, -0.33600616455078125, -0.3235893249511719, -0.3111724853515625, -0.2987556457519531, -0.28633880615234375, -0.2739219665527344, -0.261505126953125, -0.24908828735351562, -0.23667144775390625, -0.22425460815429688, -0.2118377685546875, -0.19942092895507812, -0.18700408935546875, -0.17458724975585938, -0.16217041015625, -0.14975357055664062, -0.13733673095703125, -0.12491989135742188, -0.1125030517578125, -0.10008621215820312, -0.08766937255859375, -0.07525253295898438, -0.062835693359375, -0.050418853759765625, -0.03800201416015625, -0.025585174560546875, -0.0131683349609375, -0.000751495361328125, 0.01166534423828125, 0.024082183837890625, 0.0364990234375, 0.048915863037109375, 0.06133270263671875, 0.07374954223632812, 0.0861663818359375, 0.09858322143554688, 0.11100006103515625, 0.12341690063476562, 0.135833740234375, 0.14825057983398438, 0.16066741943359375, 0.17308425903320312, 0.1855010986328125, 0.19791793823242188, 0.21033477783203125, 0.22275161743164062, 0.23516845703125, 0.24758529663085938, 0.26000213623046875, 0.2724189758300781, 0.2848358154296875, 0.2972526550292969, 0.30966949462890625, 0.3220863342285156, 0.334503173828125, 0.3469200134277344, 0.35933685302734375, 0.3717536926269531, 0.3841705322265625, 0.3965873718261719, 0.40900421142578125, 0.4214210510253906, 0.433837890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 5.0, 37.0, 78.0, 378.0, 415.0, 71.0, 14.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.805763244628906, -48.72344970703125, -47.64113235473633, -46.55881881713867, -45.47650146484375, -44.394187927246094, -43.31187057495117, -42.229557037353516, -41.147239685058594, -40.06492614746094, -38.982608795166016, -37.90029525756836, -36.81797790527344, -35.73566436767578, -34.65334701538086, -33.5710334777832, -32.48871612548828, -31.406400680541992, -30.324085235595703, -29.241769790649414, -28.159454345703125, -27.077138900756836, -25.994823455810547, -24.91250991821289, -23.830196380615234, -22.747880935668945, -21.665565490722656, -20.583250045776367, -19.500934600830078, -18.41861915588379, -17.3363037109375, -16.253990173339844, -15.171670913696289, -14.08935546875, -13.007040023803711, -11.924724578857422, -10.842409133911133, -9.760093688964844, -8.677779197692871, -7.595463752746582, -6.513148307800293, -5.430832862854004, -4.348517417907715, -3.266202449798584, -2.183887004852295, -1.1015715599060059, -0.019256591796875, 1.063058853149414, 2.145374298095703, 3.227689743041992, 4.310005187988281, 5.392320156097412, 6.474635601043701, 7.55695104598999, 8.639266014099121, 9.72158145904541, 10.8038969039917, 11.886212348937988, 12.968527793884277, 14.05084228515625, 15.133157730102539, 16.215473175048828, 17.297788619995117, 18.380104064941406, 19.462419509887695]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 7.0, 7.0, 8.0, 6.0, 3.0, 15.0, 18.0, 20.0, 12.0, 15.0, 12.0, 17.0, 18.0, 19.0, 17.0, 25.0, 33.0, 126.0, 207.0, 133.0, 37.0, 23.0, 31.0, 24.0, 14.0, 20.0, 10.0, 16.0, 15.0, 13.0, 5.0, 9.0, 6.0, 14.0, 9.0, 4.0, 5.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.094806671142578, -8.814618110656738, -8.534429550170898, -8.254241943359375, -7.974053382873535, -7.693864822387695, -7.4136762619018555, -7.133487701416016, -6.853299617767334, -6.573111057281494, -6.2929229736328125, -6.012734413146973, -5.732545852661133, -5.452357769012451, -5.172169208526611, -4.89198112487793, -4.61179256439209, -4.33160400390625, -4.051415920257568, -3.7712273597717285, -3.4910390377044678, -3.210850715637207, -2.930662155151367, -2.6504738330841064, -2.3702855110168457, -2.090097188949585, -1.8099087476730347, -1.5297203063964844, -1.2495319843292236, -0.9693436622619629, -0.6891552209854126, -0.4089667797088623, -0.12877845764160156, 0.15140992403030396, 0.4315983057022095, 0.711786687374115, 0.9919750690460205, 1.2721633911132812, 1.5523518323898315, 1.8325402736663818, 2.1127285957336426, 2.3929169178009033, 2.673105239868164, 2.953293800354004, 3.2334821224212646, 3.5136704444885254, 3.7938590049743652, 4.074047088623047, 4.354235649108887, 4.634424209594727, 4.914612293243408, 5.194800853729248, 5.47498893737793, 5.7551774978637695, 6.035366058349609, 6.315554618835449, 6.595742702484131, 6.875931262969971, 7.156119346618652, 7.436307907104492, 7.716496467590332, 7.996684551239014, 8.276872634887695, 8.557061195373535, 8.837249755859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 13.0, 13.0, 22.0, 18.0, 17.0, 18.0, 29.0, 26.0, 27.0, 33.0, 41.0, 93.0, 237.0, 140.0, 52.0, 35.0, 36.0, 23.0, 21.0, 16.0, 16.0, 12.0, 9.0, 2.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.87091064453125, -0.8394775390625, -0.80804443359375, -0.776611328125, -0.74517822265625, -0.7137451171875, -0.68231201171875, -0.65087890625, -0.61944580078125, -0.5880126953125, -0.55657958984375, -0.525146484375, -0.49371337890625, -0.4622802734375, -0.43084716796875, -0.3994140625, -0.36798095703125, -0.3365478515625, -0.30511474609375, -0.273681640625, -0.24224853515625, -0.2108154296875, -0.17938232421875, -0.14794921875, -0.11651611328125, -0.0850830078125, -0.05364990234375, -0.022216796875, 0.00921630859375, 0.0406494140625, 0.07208251953125, 0.103515625, 0.13494873046875, 0.1663818359375, 0.19781494140625, 0.229248046875, 0.26068115234375, 0.2921142578125, 0.32354736328125, 0.35498046875, 0.38641357421875, 0.4178466796875, 0.44927978515625, 0.480712890625, 0.51214599609375, 0.5435791015625, 0.57501220703125, 0.6064453125, 0.63787841796875, 0.6693115234375, 0.70074462890625, 0.732177734375, 0.76361083984375, 0.7950439453125, 0.82647705078125, 0.85791015625, 0.88934326171875, 0.9207763671875, 0.95220947265625, 0.983642578125, 1.01507568359375, 1.0465087890625, 1.07794189453125, 1.109375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 7.0, 4.0, 7.0, 6.0, 15.0, 19.0, 25.0, 40.0, 97.0, 215.0, 858.0, 7478.0, 8368660.0, 9792.0, 930.0, 224.0, 91.0, 34.0, 24.0, 12.0, 24.0, 8.0, 7.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.864316940307617, -17.375450134277344, -16.88658332824707, -16.397714614868164, -15.90884780883789, -15.419981002807617, -14.931114196777344, -14.44224739074707, -13.95337963104248, -13.464512825012207, -12.975645065307617, -12.486778259277344, -11.99791145324707, -11.50904369354248, -11.020176887512207, -10.531309127807617, -10.042442321777344, -9.55357551574707, -9.06470775604248, -8.575840950012207, -8.086973190307617, -7.598106384277344, -7.10923957824707, -6.620372295379639, -6.131505012512207, -5.642637729644775, -5.153770446777344, -4.66490364074707, -4.176036357879639, -3.687169075012207, -3.1983020305633545, -2.709434986114502, -2.2205677032470703, -1.7317005395889282, -1.2428333759307861, -0.753966212272644, -0.26509904861450195, 0.2237682342529297, 0.7126352787017822, 1.2015023231506348, 1.6903696060180664, 2.179236888885498, 2.6681039333343506, 3.156970977783203, 3.6458382606506348, 4.134705543518066, 4.62357234954834, 5.1124396324157715, 5.601306915283203, 6.090174198150635, 6.579041481018066, 7.06790828704834, 7.5567755699157715, 8.045642852783203, 8.534509658813477, 9.02337646484375, 9.51224422454834, 10.001111030578613, 10.489978790283203, 10.978845596313477, 11.46771240234375, 11.95658016204834, 12.445446968078613, 12.934314727783203, 13.423181533813477]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 8.0, 0.0, 6.0, 7.0, 1.0, 6.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 8.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9409661293029785, -5.722023963928223, -5.503082275390625, -5.284140110015869, -5.065197944641113, -4.846256256103516, -4.62731409072876, -4.408371925354004, -4.189430236816406, -3.9704883098602295, -3.7515463829040527, -3.532604217529297, -3.31366229057312, -3.0947203636169434, -2.8757781982421875, -2.6568362712860107, -2.437894344329834, -2.2189524173736572, -2.0000104904174805, -1.7810683250427246, -1.5621263980865479, -1.343184471130371, -1.1242424249649048, -0.9053003787994385, -0.6863584518432617, -0.4674164652824402, -0.24847447872161865, -0.02953249216079712, 0.18940949440002441, 0.40835142135620117, 0.6272934675216675, 0.8462355136871338, 1.0651779174804688, 1.2841198444366455, 1.5030618906021118, 1.7220039367675781, 1.9409458637237549, 2.1598877906799316, 2.3788299560546875, 2.5977718830108643, 2.816713809967041, 3.0356557369232178, 3.2545976638793945, 3.4735398292541504, 3.692481756210327, 3.911423683166504, 4.13036584854126, 4.349308013916016, 4.568249702453613, 4.787191867828369, 5.006133556365967, 5.225075721740723, 5.44401741027832, 5.662959575653076, 5.881901741027832, 6.10084342956543, 6.3197855949401855, 6.538727760314941, 6.757669448852539, 6.976611614227295, 7.195553779602051, 7.414495468139648, 7.633437633514404, 7.85237979888916, 8.071321487426758]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 26.0, 27.0, 44.0, 44.0, 106.0, 131.0, 238.0, 472.0, 1226.0, 4297.0, 17810.0, 85839.0, 269715.0, 111618.0, 23823.0, 5862.0, 1620.0, 602.0, 288.0, 142.0, 90.0, 63.0, 42.0, 50.0, 22.0, 11.0, 12.0, 8.0, 11.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8203125, -8.5318603515625, -8.243408203125, -7.9549560546875, -7.66650390625, -7.3780517578125, -7.089599609375, -6.8011474609375, -6.5126953125, -6.2242431640625, -5.935791015625, -5.6473388671875, -5.35888671875, -5.0704345703125, -4.781982421875, -4.4935302734375, -4.205078125, -3.9166259765625, -3.628173828125, -3.3397216796875, -3.05126953125, -2.7628173828125, -2.474365234375, -2.1859130859375, -1.8974609375, -1.6090087890625, -1.320556640625, -1.0321044921875, -0.74365234375, -0.4552001953125, -0.166748046875, 0.1217041015625, 0.41015625, 0.6986083984375, 0.987060546875, 1.2755126953125, 1.56396484375, 1.8524169921875, 2.140869140625, 2.4293212890625, 2.7177734375, 3.0062255859375, 3.294677734375, 3.5831298828125, 3.87158203125, 4.1600341796875, 4.448486328125, 4.7369384765625, 5.025390625, 5.3138427734375, 5.602294921875, 5.8907470703125, 6.17919921875, 6.4676513671875, 6.756103515625, 7.0445556640625, 7.3330078125, 7.6214599609375, 7.909912109375, 8.1983642578125, 8.48681640625, 8.7752685546875, 9.063720703125, 9.3521728515625, 9.640625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 11.0, 19.0, 17.0, 27.0, 25.0, 41.0, 56.0, 62.0, 73.0, 90.0, 89.0, 83.0, 80.0, 75.0, 65.0, 44.0, 35.0, 21.0, 28.0, 17.0, 6.0, 5.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.407073974609375, -1.35906982421875, -1.311065673828125, -1.2630615234375, -1.215057373046875, -1.16705322265625, -1.119049072265625, -1.071044921875, -1.023040771484375, -0.97503662109375, -0.927032470703125, -0.8790283203125, -0.831024169921875, -0.78302001953125, -0.735015869140625, -0.68701171875, -0.639007568359375, -0.59100341796875, -0.542999267578125, -0.4949951171875, -0.446990966796875, -0.39898681640625, -0.350982666015625, -0.302978515625, -0.254974365234375, -0.20697021484375, -0.158966064453125, -0.1109619140625, -0.062957763671875, -0.01495361328125, 0.033050537109375, 0.0810546875, 0.129058837890625, 0.17706298828125, 0.225067138671875, 0.2730712890625, 0.321075439453125, 0.36907958984375, 0.417083740234375, 0.465087890625, 0.513092041015625, 0.56109619140625, 0.609100341796875, 0.6571044921875, 0.705108642578125, 0.75311279296875, 0.801116943359375, 0.84912109375, 0.897125244140625, 0.94512939453125, 0.993133544921875, 1.0411376953125, 1.089141845703125, 1.13714599609375, 1.185150146484375, 1.233154296875, 1.281158447265625, 1.32916259765625, 1.377166748046875, 1.4251708984375, 1.473175048828125, 1.52117919921875, 1.569183349609375, 1.6171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 9.0, 17.0, 99.0, 217.0, 88.0, 22.0, 11.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.651233673095703, -11.055516242980957, -10.459798812866211, -9.864081382751465, -9.268363952636719, -8.672646522521973, -8.076929092407227, -7.481212139129639, -6.885494709014893, -6.2897772789001465, -5.6940598487854, -5.0983428955078125, -4.502625465393066, -3.906907796859741, -3.311190605163574, -2.715473175048828, -2.119755744934082, -1.524038314819336, -0.9283210039138794, -0.33260369300842285, 0.26311373710632324, 0.8588311672210693, 1.4545483589172363, 2.0502657890319824, 2.6459832191467285, 3.2417006492614746, 3.8374180793762207, 4.433135032653809, 5.028852462768555, 5.624569892883301, 6.220287322998047, 6.816004753112793, 7.411722183227539, 8.007439613342285, 8.603157043457031, 9.198874473571777, 9.794591903686523, 10.39030933380127, 10.986026763916016, 11.581743240356445, 12.177461624145508, 12.773179054260254, 13.368896484375, 13.964613914489746, 14.560331344604492, 15.156048774719238, 15.751766204833984, 16.347482681274414, 16.943199157714844, 17.538915634155273, 18.134634017944336, 18.730350494384766, 19.326068878173828, 19.921785354614258, 20.51750373840332, 21.11322021484375, 21.708938598632812, 22.304655075073242, 22.900373458862305, 23.496089935302734, 24.091808319091797, 24.687524795532227, 25.28324317932129, 25.87895965576172, 26.47467803955078]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 7.0, 5.0, 6.0, 9.0, 16.0, 29.0, 86.0, 130.0, 89.0, 36.0, 13.0, 12.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.590359687805176, -8.335735321044922, -8.081110954284668, -7.826486587524414, -7.57186222076416, -7.317237854003906, -7.062613487243652, -6.807989120483398, -6.5533647537231445, -6.298740386962891, -6.044116020202637, -5.789491653442383, -5.534867286682129, -5.280242919921875, -5.025618553161621, -4.770994186401367, -4.516369819641113, -4.261745452880859, -4.0071210861206055, -3.7524967193603516, -3.4978723526000977, -3.2432479858398438, -2.98862361907959, -2.733999252319336, -2.479374885559082, -2.224750518798828, -1.9701261520385742, -1.7155017852783203, -1.4608774185180664, -1.2062530517578125, -0.9516286849975586, -0.6970043182373047, -0.4423809051513672, -0.18775653839111328, 0.06686782836914062, 0.32149219512939453, 0.5761165618896484, 0.8307409286499023, 1.0853652954101562, 1.3399896621704102, 1.594614028930664, 1.849238395690918, 2.103862762451172, 2.358487129211426, 2.6131114959716797, 2.8677358627319336, 3.1223602294921875, 3.3769845962524414, 3.6316089630126953, 3.886233329772949, 4.140857696533203, 4.395482063293457, 4.650106430053711, 4.904730796813965, 5.159355163574219, 5.413979530334473, 5.668603897094727, 5.9232282638549805, 6.177852630615234, 6.432476997375488, 6.687101364135742, 6.941725730895996, 7.19635009765625, 7.450974464416504, 7.705598831176758]}, "eval/loss": 4.188705921173096, "eval/wer": 2.4265370884569615, "eval/runtime": 1107.9648, "eval/samples_per_second": 2.385, "eval/steps_per_second": 0.299, "train/train_runtime": 8514.9113, "train/train_samples_per_second": 3.352, "train/train_steps_per_second": 0.21, "train/total_flos": 0.0, "train/train_loss": 4.24715919291492, "_wandb": {"runtime": 9966}} \ No newline at end of file