{"train/loss": 4.25, "train/learning_rate": 8.960000000000001e-05, "train/epoch": 0.88, "train/global_step": 450, "_runtime": 4102, "_timestamp": 1646207109, "_step": 449, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 66.0, 572.0, 347.0, 29.0], "bins": [-787.8201904296875, -775.0996704101562, -762.379150390625, -749.65869140625, -736.9381713867188, -724.2176513671875, -711.4971923828125, -698.7766723632812, -686.05615234375, -673.3356323242188, -660.6151123046875, -647.8946533203125, -635.1741333007812, -622.45361328125, -609.733154296875, -597.0126342773438, -584.2921142578125, -571.5715942382812, -558.85107421875, -546.130615234375, -533.4100952148438, -520.6895751953125, -507.9690856933594, -495.24859619140625, -482.528076171875, -469.80755615234375, -457.0870666503906, -444.3665771484375, -431.64605712890625, -418.925537109375, -406.2050476074219, -393.48455810546875, -380.7640686035156, -368.0435791015625, -355.32305908203125, -342.6025390625, -329.8820495605469, -317.16156005859375, -304.4410400390625, -291.72052001953125, -279.0000305175781, -266.279541015625, -253.55902099609375, -240.83851623535156, -228.11801147460938, -215.3975067138672, -202.677001953125, -189.9564971923828, -177.23597717285156, -164.51547241210938, -151.7949676513672, -139.074462890625, -126.35395812988281, -113.63345336914062, -100.91294860839844, -88.19244384765625, -75.47193908691406, -62.751434326171875, -50.03092956542969, -37.3104248046875, -24.589920043945312, -11.869415283203125, 0.8510894775390625, 13.57159423828125, 26.292097091674805]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 5.0, 6.0, 17.0, 20.0, 24.0, 21.0, 23.0, 24.0, 38.0, 26.0, 40.0, 46.0, 50.0, 47.0, 52.0, 47.0, 54.0, 46.0, 42.0, 34.0, 51.0, 38.0, 40.0, 26.0, 30.0, 21.0, 22.0, 13.0, 22.0, 12.0, 10.0, 11.0, 7.0, 11.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.69377136230469, -103.13261413574219, -99.57145690917969, -96.01029968261719, -92.44914245605469, -88.88798522949219, -85.32682800292969, -81.76567077636719, -78.20451354980469, -74.64335632324219, -71.08219909667969, -67.52104187011719, -63.95988464355469, -60.39872741699219, -56.83757019042969, -53.27641296386719, -49.71525192260742, -46.15409469604492, -42.59293746948242, -39.03178024291992, -35.47062301635742, -31.90946388244629, -28.34830665588379, -24.78714942932129, -21.22599220275879, -17.66483497619629, -14.103677749633789, -10.542519569396973, -6.981362342834473, -3.4202041625976562, 0.14095306396484375, 3.7021102905273438, 7.263267517089844, 10.824424743652344, 14.385581970214844, 17.946739196777344, 21.507896423339844, 25.069055557250977, 28.630212783813477, 32.191368103027344, 35.752525329589844, 39.313682556152344, 42.874839782714844, 46.435997009277344, 49.997154235839844, 53.558311462402344, 57.119468688964844, 60.680625915527344, 64.24179077148438, 67.80294799804688, 71.36410522460938, 74.92526245117188, 78.48641967773438, 82.04757690429688, 85.60873413085938, 89.16989135742188, 92.73104858398438, 96.29220581054688, 99.85336303710938, 103.41452026367188, 106.97567749023438, 110.53683471679688, 114.09799194335938, 117.65914916992188, 121.22030639648438]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 6.0, 14.0, 20.0, 14.0, 17.0, 26.0, 13.0, 22.0, 36.0, 26.0, 34.0, 34.0, 45.0, 39.0, 42.0, 50.0, 63.0, 50.0, 35.0, 49.0, 52.0, 39.0, 34.0, 33.0, 30.0, 26.0, 25.0, 22.0, 14.0, 20.0, 10.0, 15.0, 10.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.578125, -5.422119140625, -5.26611328125, -5.110107421875, -4.9541015625, -4.798095703125, -4.64208984375, -4.486083984375, -4.330078125, -4.174072265625, -4.01806640625, -3.862060546875, -3.7060546875, -3.550048828125, -3.39404296875, -3.238037109375, -3.08203125, -2.926025390625, -2.77001953125, -2.614013671875, -2.4580078125, -2.302001953125, -2.14599609375, -1.989990234375, -1.833984375, -1.677978515625, -1.52197265625, -1.365966796875, -1.2099609375, -1.053955078125, -0.89794921875, -0.741943359375, -0.5859375, -0.429931640625, -0.27392578125, -0.117919921875, 0.0380859375, 0.194091796875, 0.35009765625, 0.506103515625, 0.662109375, 0.818115234375, 0.97412109375, 1.130126953125, 1.2861328125, 1.442138671875, 1.59814453125, 1.754150390625, 1.91015625, 2.066162109375, 2.22216796875, 2.378173828125, 2.5341796875, 2.690185546875, 2.84619140625, 3.002197265625, 3.158203125, 3.314208984375, 3.47021484375, 3.626220703125, 3.7822265625, 3.938232421875, 4.09423828125, 4.250244140625, 4.40625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 3.0, 10.0, 13.0, 20.0, 31.0, 28.0, 42.0, 83.0, 109.0, 141.0, 232.0, 367.0, 623.0, 1057.0, 1983.0, 4405.0, 12095.0, 51669.0, 489014.0, 3157381.0, 409059.0, 46142.0, 10964.0, 4160.0, 1936.0, 1010.0, 602.0, 320.0, 232.0, 163.0, 114.0, 74.0, 56.0, 40.0, 31.0, 18.0, 18.0, 13.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.6181640625, -18.876953125, -18.1357421875, -17.39453125, -16.6533203125, -15.912109375, -15.1708984375, -14.4296875, -13.6884765625, -12.947265625, -12.2060546875, -11.46484375, -10.7236328125, -9.982421875, -9.2412109375, -8.5, -7.7587890625, -7.017578125, -6.2763671875, -5.53515625, -4.7939453125, -4.052734375, -3.3115234375, -2.5703125, -1.8291015625, -1.087890625, -0.3466796875, 0.39453125, 1.1357421875, 1.876953125, 2.6181640625, 3.359375, 4.1005859375, 4.841796875, 5.5830078125, 6.32421875, 7.0654296875, 7.806640625, 8.5478515625, 9.2890625, 10.0302734375, 10.771484375, 11.5126953125, 12.25390625, 12.9951171875, 13.736328125, 14.4775390625, 15.21875, 15.9599609375, 16.701171875, 17.4423828125, 18.18359375, 18.9248046875, 19.666015625, 20.4072265625, 21.1484375, 21.8896484375, 22.630859375, 23.3720703125, 24.11328125, 24.8544921875, 25.595703125, 26.3369140625, 27.078125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 9.0, 17.0, 36.0, 70.0, 89.0, 129.0, 199.0, 353.0, 540.0, 666.0, 633.0, 442.0, 290.0, 213.0, 145.0, 78.0, 44.0, 39.0, 25.0, 13.0, 8.0, 9.0, 12.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.703125, -26.8828125, -26.0625, -25.2421875, -24.421875, -23.6015625, -22.78125, -21.9609375, -21.140625, -20.3203125, -19.5, -18.6796875, -17.859375, -17.0390625, -16.21875, -15.3984375, -14.578125, -13.7578125, -12.9375, -12.1171875, -11.296875, -10.4765625, -9.65625, -8.8359375, -8.015625, -7.1953125, -6.375, -5.5546875, -4.734375, -3.9140625, -3.09375, -2.2734375, -1.453125, -0.6328125, 0.1875, 1.0078125, 1.828125, 2.6484375, 3.46875, 4.2890625, 5.109375, 5.9296875, 6.75, 7.5703125, 8.390625, 9.2109375, 10.03125, 10.8515625, 11.671875, 12.4921875, 13.3125, 14.1328125, 14.953125, 15.7734375, 16.59375, 17.4140625, 18.234375, 19.0546875, 19.875, 20.6953125, 21.515625, 22.3359375, 23.15625, 23.9765625, 24.796875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 3.0, 6.0, 16.0, 30.0, 33.0, 69.0, 132.0, 205.0, 358.0, 681.0, 1499.0, 6302.0, 356888.0, 3780150.0, 42594.0, 2923.0, 1053.0, 539.0, 285.0, 191.0, 112.0, 64.0, 35.0, 22.0, 25.0, 14.0, 13.0, 10.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.3125, -79.763671875, -77.21484375, -74.666015625, -72.1171875, -69.568359375, -67.01953125, -64.470703125, -61.921875, -59.373046875, -56.82421875, -54.275390625, -51.7265625, -49.177734375, -46.62890625, -44.080078125, -41.53125, -38.982421875, -36.43359375, -33.884765625, -31.3359375, -28.787109375, -26.23828125, -23.689453125, -21.140625, -18.591796875, -16.04296875, -13.494140625, -10.9453125, -8.396484375, -5.84765625, -3.298828125, -0.75, 1.798828125, 4.34765625, 6.896484375, 9.4453125, 11.994140625, 14.54296875, 17.091796875, 19.640625, 22.189453125, 24.73828125, 27.287109375, 29.8359375, 32.384765625, 34.93359375, 37.482421875, 40.03125, 42.580078125, 45.12890625, 47.677734375, 50.2265625, 52.775390625, 55.32421875, 57.873046875, 60.421875, 62.970703125, 65.51953125, 68.068359375, 70.6171875, 73.166015625, 75.71484375, 78.263671875, 80.8125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 32.0, 662.0, 303.0, 15.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-717.9820556640625, -702.9147338867188, -687.8473510742188, -672.780029296875, -657.712646484375, -642.6453247070312, -627.5779418945312, -612.5106201171875, -597.4432373046875, -582.3759155273438, -567.3085327148438, -552.2412109375, -537.173828125, -522.1065063476562, -507.0391540527344, -491.9718017578125, -476.90447998046875, -461.8371276855469, -446.769775390625, -431.7024230957031, -416.63507080078125, -401.5677490234375, -386.5003967285156, -371.43304443359375, -356.3656921386719, -341.29833984375, -326.2309875488281, -311.16363525390625, -296.0963134765625, -281.0289306640625, -265.96160888671875, -250.89425659179688, -235.82688903808594, -220.75953674316406, -205.69219970703125, -190.62484741210938, -175.5574951171875, -160.49014282226562, -145.42279052734375, -130.35545349121094, -115.28810119628906, -100.22074890136719, -85.15340423583984, -70.0860595703125, -55.018707275390625, -39.95135498046875, -24.884010314941406, -9.816665649414062, 5.2506866455078125, 20.318035125732422, 35.38538360595703, 50.45273208618164, 65.52008056640625, 80.58743286132812, 95.65477752685547, 110.72212219238281, 125.78947448730469, 140.85682678222656, 155.92416381835938, 170.99151611328125, 186.05886840820312, 201.126220703125, 216.19357299804688, 231.2609100341797, 246.32826232910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 9.0, 9.0, 19.0, 23.0, 22.0, 34.0, 32.0, 33.0, 36.0, 47.0, 53.0, 40.0, 60.0, 58.0, 71.0, 56.0, 41.0, 51.0, 40.0, 33.0, 41.0, 32.0, 31.0, 23.0, 17.0, 15.0, 15.0, 6.0, 11.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-140.79763793945312, -137.32191467285156, -133.84619140625, -130.37046813964844, -126.89473724365234, -123.41901397705078, -119.94328308105469, -116.46755981445312, -112.99183654785156, -109.51611328125, -106.04039001464844, -102.56465911865234, -99.08893585205078, -95.61321258544922, -92.13748168945312, -88.66175842285156, -85.18603515625, -81.71031188964844, -78.23458862304688, -74.75885772705078, -71.28313446044922, -67.80741119384766, -64.33168029785156, -60.85595703125, -57.38023376464844, -53.904510498046875, -50.42878341674805, -46.95305633544922, -43.477333068847656, -40.001609802246094, -36.525882720947266, -33.05015563964844, -29.574424743652344, -26.09869956970215, -22.622974395751953, -19.147249221801758, -15.671524047851562, -12.195798873901367, -8.720073699951172, -5.244348526000977, -1.7686233520507812, 1.707101821899414, 5.182826995849609, 8.658552169799805, 12.13427734375, 15.610002517700195, 19.08572769165039, 22.561452865600586, 26.03717803955078, 29.512903213500977, 32.98862838745117, 36.46435546875, 39.94007873535156, 43.415802001953125, 46.89152908325195, 50.36725616455078, 53.842979431152344, 57.318702697753906, 60.794429779052734, 64.27015686035156, 67.74588012695312, 71.22160339355469, 74.69732666015625, 78.17305755615234, 81.6487808227539]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 9.0, 12.0, 12.0, 8.0, 14.0, 15.0, 15.0, 17.0, 22.0, 22.0, 23.0, 23.0, 27.0, 42.0, 36.0, 29.0, 42.0, 35.0, 40.0, 37.0, 43.0, 39.0, 43.0, 29.0, 35.0, 45.0, 21.0, 36.0, 32.0, 19.0, 21.0, 17.0, 21.0, 16.0, 9.0, 16.0, 10.0, 13.0, 12.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.79296875, -4.6435546875, -4.494140625, -4.3447265625, -4.1953125, -4.0458984375, -3.896484375, -3.7470703125, -3.59765625, -3.4482421875, -3.298828125, -3.1494140625, -3.0, -2.8505859375, -2.701171875, -2.5517578125, -2.40234375, -2.2529296875, -2.103515625, -1.9541015625, -1.8046875, -1.6552734375, -1.505859375, -1.3564453125, -1.20703125, -1.0576171875, -0.908203125, -0.7587890625, -0.609375, -0.4599609375, -0.310546875, -0.1611328125, -0.01171875, 0.1376953125, 0.287109375, 0.4365234375, 0.5859375, 0.7353515625, 0.884765625, 1.0341796875, 1.18359375, 1.3330078125, 1.482421875, 1.6318359375, 1.78125, 1.9306640625, 2.080078125, 2.2294921875, 2.37890625, 2.5283203125, 2.677734375, 2.8271484375, 2.9765625, 3.1259765625, 3.275390625, 3.4248046875, 3.57421875, 3.7236328125, 3.873046875, 4.0224609375, 4.171875, 4.3212890625, 4.470703125, 4.6201171875, 4.76953125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 1.0, 8.0, 12.0, 21.0, 27.0, 33.0, 62.0, 72.0, 124.0, 175.0, 245.0, 384.0, 537.0, 779.0, 1127.0, 1624.0, 2281.0, 3413.0, 5002.0, 7504.0, 11191.0, 16773.0, 25306.0, 38662.0, 58856.0, 87974.0, 124445.0, 161289.0, 152065.0, 114636.0, 78416.0, 52444.0, 34325.0, 22672.0, 14955.0, 9973.0, 6708.0, 4491.0, 3123.0, 2065.0, 1486.0, 1004.0, 724.0, 531.0, 313.0, 239.0, 157.0, 97.0, 69.0, 51.0, 34.0, 27.0, 9.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.357421875, -0.3458404541015625, -0.334259033203125, -0.3226776123046875, -0.31109619140625, -0.2995147705078125, -0.287933349609375, -0.2763519287109375, -0.2647705078125, -0.2531890869140625, -0.241607666015625, -0.2300262451171875, -0.21844482421875, -0.2068634033203125, -0.195281982421875, -0.1837005615234375, -0.172119140625, -0.1605377197265625, -0.148956298828125, -0.1373748779296875, -0.12579345703125, -0.1142120361328125, -0.102630615234375, -0.0910491943359375, -0.0794677734375, -0.0678863525390625, -0.056304931640625, -0.0447235107421875, -0.03314208984375, -0.0215606689453125, -0.009979248046875, 0.0016021728515625, 0.01318359375, 0.0247650146484375, 0.036346435546875, 0.0479278564453125, 0.05950927734375, 0.0710906982421875, 0.082672119140625, 0.0942535400390625, 0.1058349609375, 0.1174163818359375, 0.128997802734375, 0.1405792236328125, 0.15216064453125, 0.1637420654296875, 0.175323486328125, 0.1869049072265625, 0.198486328125, 0.2100677490234375, 0.221649169921875, 0.2332305908203125, 0.24481201171875, 0.2563934326171875, 0.267974853515625, 0.2795562744140625, 0.2911376953125, 0.3027191162109375, 0.314300537109375, 0.3258819580078125, 0.33746337890625, 0.3490447998046875, 0.360626220703125, 0.3722076416015625, 0.3837890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 6.0, 2.0, 5.0, 11.0, 10.0, 9.0, 10.0, 16.0, 20.0, 19.0, 25.0, 28.0, 23.0, 26.0, 33.0, 37.0, 41.0, 44.0, 48.0, 33.0, 1056.0, 42.0, 41.0, 39.0, 40.0, 34.0, 35.0, 29.0, 35.0, 35.0, 23.0, 11.0, 21.0, 22.0, 21.0, 15.0, 12.0, 9.0, 11.0, 12.0, 4.0, 6.0, 6.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.083984375, -2.984283447265625, -2.88458251953125, -2.784881591796875, -2.6851806640625, -2.585479736328125, -2.48577880859375, -2.386077880859375, -2.286376953125, -2.186676025390625, -2.08697509765625, -1.987274169921875, -1.8875732421875, -1.787872314453125, -1.68817138671875, -1.588470458984375, -1.48876953125, -1.389068603515625, -1.28936767578125, -1.189666748046875, -1.0899658203125, -0.990264892578125, -0.89056396484375, -0.790863037109375, -0.691162109375, -0.591461181640625, -0.49176025390625, -0.392059326171875, -0.2923583984375, -0.192657470703125, -0.09295654296875, 0.006744384765625, 0.1064453125, 0.206146240234375, 0.30584716796875, 0.405548095703125, 0.5052490234375, 0.604949951171875, 0.70465087890625, 0.804351806640625, 0.904052734375, 1.003753662109375, 1.10345458984375, 1.203155517578125, 1.3028564453125, 1.402557373046875, 1.50225830078125, 1.601959228515625, 1.70166015625, 1.801361083984375, 1.90106201171875, 2.000762939453125, 2.1004638671875, 2.200164794921875, 2.29986572265625, 2.399566650390625, 2.499267578125, 2.598968505859375, 2.69866943359375, 2.798370361328125, 2.8980712890625, 2.997772216796875, 3.09747314453125, 3.197174072265625, 3.296875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 7.0, 19.0, 33.0, 42.0, 65.0, 93.0, 152.0, 196.0, 317.0, 495.0, 712.0, 1139.0, 1678.0, 2633.0, 3947.0, 6174.0, 9022.0, 14139.0, 21474.0, 32713.0, 48330.0, 71075.0, 99637.0, 132923.0, 1178445.0, 142052.0, 103663.0, 74837.0, 51194.0, 34137.0, 22345.0, 15031.0, 9801.0, 6278.0, 4184.0, 2781.0, 1801.0, 1193.0, 786.0, 571.0, 337.0, 230.0, 159.0, 86.0, 65.0, 45.0, 29.0, 22.0, 18.0, 8.0, 7.0, 2.0, 2.0, 3.0], "bins": [-0.276611328125, -0.26861000061035156, -0.2606086730957031, -0.2526073455810547, -0.24460601806640625, -0.2366046905517578, -0.22860336303710938, -0.22060203552246094, -0.2126007080078125, -0.20459938049316406, -0.19659805297851562, -0.1885967254638672, -0.18059539794921875, -0.1725940704345703, -0.16459274291992188, -0.15659141540527344, -0.148590087890625, -0.14058876037597656, -0.13258743286132812, -0.12458610534667969, -0.11658477783203125, -0.10858345031738281, -0.10058212280273438, -0.09258079528808594, -0.0845794677734375, -0.07657814025878906, -0.06857681274414062, -0.06057548522949219, -0.05257415771484375, -0.04457283020019531, -0.036571502685546875, -0.028570175170898438, -0.02056884765625, -0.012567520141601562, -0.004566192626953125, 0.0034351348876953125, 0.01143646240234375, 0.019437789916992188, 0.027439117431640625, 0.03544044494628906, 0.0434417724609375, 0.05144309997558594, 0.059444427490234375, 0.06744575500488281, 0.07544708251953125, 0.08344841003417969, 0.09144973754882812, 0.09945106506347656, 0.107452392578125, 0.11545372009277344, 0.12345504760742188, 0.1314563751220703, 0.13945770263671875, 0.1474590301513672, 0.15546035766601562, 0.16346168518066406, 0.1714630126953125, 0.17946434020996094, 0.18746566772460938, 0.1954669952392578, 0.20346832275390625, 0.2114696502685547, 0.21947097778320312, 0.22747230529785156, 0.2354736328125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 5.0, 9.0, 10.0, 13.0, 27.0, 22.0, 39.0, 38.0, 38.0, 42.0, 52.0, 67.0, 71.0, 97.0, 67.0, 80.0, 46.0, 50.0, 29.0, 23.0, 32.0, 16.0, 18.0, 14.0, 14.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005405426025390625, -0.005237162113189697, -0.0050688982009887695, -0.004900634288787842, -0.004732370376586914, -0.004564106464385986, -0.004395842552185059, -0.004227578639984131, -0.004059314727783203, -0.0038910508155822754, -0.0037227869033813477, -0.00355452299118042, -0.003386259078979492, -0.0032179951667785645, -0.0030497312545776367, -0.002881467342376709, -0.0027132034301757812, -0.0025449395179748535, -0.0023766756057739258, -0.002208411693572998, -0.0020401477813720703, -0.0018718838691711426, -0.0017036199569702148, -0.0015353560447692871, -0.0013670921325683594, -0.0011988282203674316, -0.001030564308166504, -0.0008623003959655762, -0.0006940364837646484, -0.0005257725715637207, -0.00035750865936279297, -0.00018924474716186523, -2.09808349609375e-05, 0.00014728307723999023, 0.00031554698944091797, 0.0004838109016418457, 0.0006520748138427734, 0.0008203387260437012, 0.000988602638244629, 0.0011568665504455566, 0.0013251304626464844, 0.0014933943748474121, 0.0016616582870483398, 0.0018299221992492676, 0.0019981861114501953, 0.002166450023651123, 0.0023347139358520508, 0.0025029778480529785, 0.0026712417602539062, 0.002839505672454834, 0.0030077695846557617, 0.0031760334968566895, 0.003344297409057617, 0.003512561321258545, 0.0036808252334594727, 0.0038490891456604004, 0.004017353057861328, 0.004185616970062256, 0.004353880882263184, 0.004522144794464111, 0.004690408706665039, 0.004858672618865967, 0.0050269365310668945, 0.005195200443267822, 0.00536346435546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 11.0, 9.0, 8.0, 6.0, 12.0, 17.0, 8.0, 23.0, 34.0, 45.0, 41.0, 57.0, 64.0, 100.0, 152.0, 166.0, 175.0, 328.0, 666.0, 23190.0, 1018495.0, 3289.0, 482.0, 280.0, 185.0, 131.0, 100.0, 95.0, 69.0, 54.0, 40.0, 33.0, 29.0, 24.0, 19.0, 15.0, 15.0, 13.0, 14.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09375, -0.09075736999511719, -0.08776473999023438, -0.08477210998535156, -0.08177947998046875, -0.07878684997558594, -0.07579421997070312, -0.07280158996582031, -0.0698089599609375, -0.06681632995605469, -0.06382369995117188, -0.06083106994628906, -0.05783843994140625, -0.05484580993652344, -0.051853179931640625, -0.04886054992675781, -0.045867919921875, -0.04287528991699219, -0.039882659912109375, -0.03689002990722656, -0.03389739990234375, -0.030904769897460938, -0.027912139892578125, -0.024919509887695312, -0.0219268798828125, -0.018934249877929688, -0.015941619873046875, -0.012948989868164062, -0.00995635986328125, -0.0069637298583984375, -0.003971099853515625, -0.0009784698486328125, 0.00201416015625, 0.0050067901611328125, 0.007999420166015625, 0.010992050170898438, 0.01398468017578125, 0.016977310180664062, 0.019969940185546875, 0.022962570190429688, 0.0259552001953125, 0.028947830200195312, 0.031940460205078125, 0.03493309020996094, 0.03792572021484375, 0.04091835021972656, 0.043910980224609375, 0.04690361022949219, 0.049896240234375, 0.05288887023925781, 0.055881500244140625, 0.05887413024902344, 0.06186676025390625, 0.06485939025878906, 0.06785202026367188, 0.07084465026855469, 0.0738372802734375, 0.07682991027832031, 0.07982254028320312, 0.08281517028808594, 0.08580780029296875, 0.08880043029785156, 0.09179306030273438, 0.09478569030761719, 0.0977783203125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 29.0, 478.0, 468.0, 37.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026848042383790016, -0.026341192424297333, -0.0258343443274498, -0.025327494367957115, -0.024820644408464432, -0.02431379444897175, -0.023806946352124214, -0.02330009639263153, -0.022793246433138847, -0.022286396473646164, -0.02177954837679863, -0.021272698417305946, -0.020765848457813263, -0.02025899849832058, -0.019752150401473045, -0.019245300441980362, -0.018738452345132828, -0.018231602385640144, -0.01772475428879261, -0.017217904329299927, -0.016711054369807243, -0.01620420441031456, -0.015697356313467026, -0.015190506353974342, -0.014683656394481659, -0.01417680736631155, -0.013669957406818867, -0.013163108378648758, -0.012656258419156075, -0.012149409390985966, -0.011642560362815857, -0.011135710403323174, -0.01062886044383049, -0.010122011415660381, -0.009615161456167698, -0.009108312427997589, -0.008601462468504906, -0.008094613440334797, -0.007587763946503401, -0.007080914452672005, -0.006574064493179321, -0.006067214999347925, -0.005560365505516529, -0.00505351647734642, -0.004546666517853737, -0.004039817489683628, -0.003532967995852232, -0.003026118502020836, -0.0025192690081894398, -0.0020124195143580437, -0.0015055701369419694, -0.0009987207595258951, -0.000491871265694499, 1.4978228136897087e-05, 0.0005218274891376495, 0.0010286769829690456, 0.0015355264768004417, 0.002042375970631838, 0.002549225464463234, 0.0030560747254639864, 0.0035629242192953825, 0.004069773480296135, 0.004576622974127531, 0.005083472467958927, 0.005590321961790323]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 7.0, 9.0, 10.0, 17.0, 12.0, 11.0, 24.0, 24.0, 20.0, 20.0, 26.0, 29.0, 42.0, 24.0, 31.0, 30.0, 38.0, 37.0, 37.0, 35.0, 44.0, 44.0, 39.0, 47.0, 35.0, 36.0, 32.0, 31.0, 26.0, 18.0, 15.0, 20.0, 23.0, 20.0, 7.0, 14.0, 8.0, 6.0, 9.0, 2.0, 5.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002948284149169922, -0.0028636185452342033, -0.002778952941298485, -0.0026942873373627663, -0.0026096217334270477, -0.002524956129491329, -0.0024402905255556107, -0.002355624921619892, -0.0022709593176841736, -0.002186293713748455, -0.0021016281098127365, -0.002016962505877018, -0.0019322969019412994, -0.001847631298005581, -0.0017629656940698624, -0.0016783000901341438, -0.0015936344861984253, -0.0015089688822627068, -0.0014243032783269882, -0.0013396376743912697, -0.0012549720704555511, -0.0011703064665198326, -0.001085640862584114, -0.0010009752586483955, -0.000916309654712677, -0.0008316440507769585, -0.0007469784468412399, -0.0006623128429055214, -0.0005776472389698029, -0.0004929816350340843, -0.0004083160310983658, -0.00032365042716264725, -0.0002389848232269287, -0.00015431921929121017, -6.965361535549164e-05, 1.5011988580226898e-05, 9.967759251594543e-05, 0.00018434319645166397, 0.0002690088003873825, 0.00035367440432310104, 0.0004383400082588196, 0.0005230056121945381, 0.0006076712161302567, 0.0006923368200659752, 0.0007770024240016937, 0.0008616680279374123, 0.0009463336318731308, 0.0010309992358088493, 0.0011156648397445679, 0.0012003304436802864, 0.001284996047616005, 0.0013696616515517235, 0.001454327255487442, 0.0015389928594231606, 0.001623658463358879, 0.0017083240672945976, 0.0017929896712303162, 0.0018776552751660347, 0.0019623208791017532, 0.0020469864830374718, 0.0021316520869731903, 0.002216317690908909, 0.0023009832948446274, 0.002385648898780346, 0.0024703145027160645]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 9.0, 12.0, 12.0, 8.0, 14.0, 15.0, 15.0, 17.0, 22.0, 22.0, 23.0, 23.0, 27.0, 42.0, 36.0, 29.0, 42.0, 35.0, 40.0, 37.0, 43.0, 39.0, 43.0, 29.0, 35.0, 45.0, 21.0, 36.0, 32.0, 19.0, 21.0, 17.0, 21.0, 16.0, 9.0, 16.0, 10.0, 13.0, 12.0, 9.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.79296875, -4.6435546875, -4.494140625, -4.3447265625, -4.1953125, -4.0458984375, -3.896484375, -3.7470703125, -3.59765625, -3.4482421875, -3.298828125, -3.1494140625, -3.0, -2.8505859375, -2.701171875, -2.5517578125, -2.40234375, -2.2529296875, -2.103515625, -1.9541015625, -1.8046875, -1.6552734375, -1.505859375, -1.3564453125, -1.20703125, -1.0576171875, -0.908203125, -0.7587890625, -0.609375, -0.4599609375, -0.310546875, -0.1611328125, -0.01171875, 0.1376953125, 0.287109375, 0.4365234375, 0.5859375, 0.7353515625, 0.884765625, 1.0341796875, 1.18359375, 1.3330078125, 1.482421875, 1.6318359375, 1.78125, 1.9306640625, 2.080078125, 2.2294921875, 2.37890625, 2.5283203125, 2.677734375, 2.8271484375, 2.9765625, 3.1259765625, 3.275390625, 3.4248046875, 3.57421875, 3.7236328125, 3.873046875, 4.0224609375, 4.171875, 4.3212890625, 4.470703125, 4.6201171875, 4.76953125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 10.0, 12.0, 23.0, 25.0, 46.0, 58.0, 87.0, 123.0, 153.0, 260.0, 383.0, 545.0, 782.0, 1145.0, 1549.0, 2166.0, 3297.0, 4939.0, 7800.0, 13853.0, 30573.0, 96732.0, 425654.0, 325718.0, 73711.0, 25486.0, 12118.0, 6957.0, 4470.0, 3031.0, 2043.0, 1431.0, 1033.0, 745.0, 483.0, 337.0, 221.0, 175.0, 111.0, 78.0, 70.0, 42.0, 27.0, 21.0, 13.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.046875, -14.5894775390625, -14.132080078125, -13.6746826171875, -13.21728515625, -12.7598876953125, -12.302490234375, -11.8450927734375, -11.3876953125, -10.9302978515625, -10.472900390625, -10.0155029296875, -9.55810546875, -9.1007080078125, -8.643310546875, -8.1859130859375, -7.728515625, -7.2711181640625, -6.813720703125, -6.3563232421875, -5.89892578125, -5.4415283203125, -4.984130859375, -4.5267333984375, -4.0693359375, -3.6119384765625, -3.154541015625, -2.6971435546875, -2.23974609375, -1.7823486328125, -1.324951171875, -0.8675537109375, -0.41015625, 0.0472412109375, 0.504638671875, 0.9620361328125, 1.41943359375, 1.8768310546875, 2.334228515625, 2.7916259765625, 3.2490234375, 3.7064208984375, 4.163818359375, 4.6212158203125, 5.07861328125, 5.5360107421875, 5.993408203125, 6.4508056640625, 6.908203125, 7.3656005859375, 7.822998046875, 8.2803955078125, 8.73779296875, 9.1951904296875, 9.652587890625, 10.1099853515625, 10.5673828125, 11.0247802734375, 11.482177734375, 11.9395751953125, 12.39697265625, 12.8543701171875, 13.311767578125, 13.7691650390625, 14.2265625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 4.0, 13.0, 13.0, 12.0, 10.0, 19.0, 26.0, 27.0, 34.0, 42.0, 44.0, 54.0, 81.0, 93.0, 149.0, 1573.0, 369.0, 82.0, 70.0, 49.0, 59.0, 42.0, 38.0, 33.0, 34.0, 19.0, 14.0, 8.0, 7.0, 7.0, 4.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.953125, -24.236328125, -23.51953125, -22.802734375, -22.0859375, -21.369140625, -20.65234375, -19.935546875, -19.21875, -18.501953125, -17.78515625, -17.068359375, -16.3515625, -15.634765625, -14.91796875, -14.201171875, -13.484375, -12.767578125, -12.05078125, -11.333984375, -10.6171875, -9.900390625, -9.18359375, -8.466796875, -7.75, -7.033203125, -6.31640625, -5.599609375, -4.8828125, -4.166015625, -3.44921875, -2.732421875, -2.015625, -1.298828125, -0.58203125, 0.134765625, 0.8515625, 1.568359375, 2.28515625, 3.001953125, 3.71875, 4.435546875, 5.15234375, 5.869140625, 6.5859375, 7.302734375, 8.01953125, 8.736328125, 9.453125, 10.169921875, 10.88671875, 11.603515625, 12.3203125, 13.037109375, 13.75390625, 14.470703125, 15.1875, 15.904296875, 16.62109375, 17.337890625, 18.0546875, 18.771484375, 19.48828125, 20.205078125, 20.921875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 8.0, 13.0, 15.0, 26.0, 21.0, 35.0, 35.0, 59.0, 75.0, 116.0, 323.0, 1770.0, 2951074.0, 190376.0, 1048.0, 276.0, 110.0, 76.0, 38.0, 44.0, 32.0, 31.0, 21.0, 8.0, 14.0, 11.0, 16.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.8125, -92.708984375, -89.60546875, -86.501953125, -83.3984375, -80.294921875, -77.19140625, -74.087890625, -70.984375, -67.880859375, -64.77734375, -61.673828125, -58.5703125, -55.466796875, -52.36328125, -49.259765625, -46.15625, -43.052734375, -39.94921875, -36.845703125, -33.7421875, -30.638671875, -27.53515625, -24.431640625, -21.328125, -18.224609375, -15.12109375, -12.017578125, -8.9140625, -5.810546875, -2.70703125, 0.396484375, 3.5, 6.603515625, 9.70703125, 12.810546875, 15.9140625, 19.017578125, 22.12109375, 25.224609375, 28.328125, 31.431640625, 34.53515625, 37.638671875, 40.7421875, 43.845703125, 46.94921875, 50.052734375, 53.15625, 56.259765625, 59.36328125, 62.466796875, 65.5703125, 68.673828125, 71.77734375, 74.880859375, 77.984375, 81.087890625, 84.19140625, 87.294921875, 90.3984375, 93.501953125, 96.60546875, 99.708984375, 102.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 246.0, 762.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.12577819824219, -39.5609130859375, -29.996047973632812, -20.431182861328125, -10.866317749023438, -1.30145263671875, 8.263412475585938, 17.828277587890625, 27.393142700195312, 36.9580078125, 46.52287292480469, 56.087738037109375, 65.65260314941406, 75.21746826171875, 84.78233337402344, 94.34719848632812, 103.91206359863281, 113.4769287109375, 123.04179382324219, 132.60665893554688, 142.17152404785156, 151.73638916015625, 161.30125427246094, 170.86611938476562, 180.4309844970703, 189.995849609375, 199.5607147216797, 209.12557983398438, 218.69044494628906, 228.25531005859375, 237.82017517089844, 247.38504028320312, 256.94989013671875, 266.5147705078125, 276.0796203613281, 285.64447021484375, 295.2093505859375, 304.77423095703125, 314.3390808105469, 323.9039306640625, 333.46881103515625, 343.03369140625, 352.5985412597656, 362.16339111328125, 371.728271484375, 381.29315185546875, 390.8580017089844, 400.4228515625, 409.98773193359375, 419.5526123046875, 429.1174621582031, 438.68231201171875, 448.2471923828125, 457.81207275390625, 467.3769226074219, 476.9417724609375, 486.50665283203125, 496.071533203125, 505.6363830566406, 515.2012329101562, 524.76611328125, 534.3309936523438, 543.8958740234375, 553.460693359375, 563.0255737304688]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 12.0, 9.0, 20.0, 15.0, 15.0, 18.0, 21.0, 16.0, 29.0, 25.0, 35.0, 36.0, 42.0, 45.0, 40.0, 39.0, 31.0, 32.0, 37.0, 42.0, 40.0, 45.0, 39.0, 29.0, 39.0, 36.0, 25.0, 21.0, 23.0, 22.0, 17.0, 16.0, 15.0, 15.0, 7.0, 8.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-54.32135009765625, -52.57880783081055, -50.83626174926758, -49.093719482421875, -47.351173400878906, -45.6086311340332, -43.866085052490234, -42.12354278564453, -40.38099670410156, -38.63845443725586, -36.89590835571289, -35.15336608886719, -33.41082000732422, -31.668277740478516, -29.925731658935547, -28.183189392089844, -26.440645217895508, -24.698101043701172, -22.955556869506836, -21.2130126953125, -19.470468521118164, -17.727924346923828, -15.985381126403809, -14.242836952209473, -12.500292778015137, -10.7577486038208, -9.015204429626465, -7.272660732269287, -5.530116558074951, -3.7875728607177734, -2.0450286865234375, -0.30248451232910156, 1.4400596618652344, 3.1826038360595703, 4.925148010253906, 6.667691707611084, 8.410236358642578, 10.152779579162598, 11.895323753356934, 13.63786792755127, 15.380412101745605, 17.122955322265625, 18.86549949645996, 20.608043670654297, 22.350587844848633, 24.09313201904297, 25.835676193237305, 27.57822036743164, 29.320764541625977, 31.063308715820312, 32.805850982666016, 34.548397064208984, 36.29093933105469, 38.033485412597656, 39.77602767944336, 41.51857376098633, 43.26111602783203, 45.003658294677734, 46.7462043762207, 48.488746643066406, 50.231292724609375, 51.97383499145508, 53.71638107299805, 55.45892333984375, 57.20146942138672]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 14.0, 11.0, 7.0, 10.0, 9.0, 16.0, 21.0, 19.0, 21.0, 22.0, 23.0, 36.0, 29.0, 30.0, 37.0, 32.0, 41.0, 43.0, 37.0, 48.0, 47.0, 38.0, 43.0, 35.0, 40.0, 37.0, 28.0, 23.0, 30.0, 12.0, 28.0, 17.0, 18.0, 19.0, 11.0, 11.0, 11.0, 9.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.30859375, -5.14068603515625, -4.9727783203125, -4.80487060546875, -4.636962890625, -4.46905517578125, -4.3011474609375, -4.13323974609375, -3.96533203125, -3.79742431640625, -3.6295166015625, -3.46160888671875, -3.293701171875, -3.12579345703125, -2.9578857421875, -2.78997802734375, -2.6220703125, -2.45416259765625, -2.2862548828125, -2.11834716796875, -1.950439453125, -1.78253173828125, -1.6146240234375, -1.44671630859375, -1.27880859375, -1.11090087890625, -0.9429931640625, -0.77508544921875, -0.607177734375, -0.43927001953125, -0.2713623046875, -0.10345458984375, 0.064453125, 0.23236083984375, 0.4002685546875, 0.56817626953125, 0.736083984375, 0.90399169921875, 1.0718994140625, 1.23980712890625, 1.40771484375, 1.57562255859375, 1.7435302734375, 1.91143798828125, 2.079345703125, 2.24725341796875, 2.4151611328125, 2.58306884765625, 2.7509765625, 2.91888427734375, 3.0867919921875, 3.25469970703125, 3.422607421875, 3.59051513671875, 3.7584228515625, 3.92633056640625, 4.09423828125, 4.26214599609375, 4.4300537109375, 4.59796142578125, 4.765869140625, 4.93377685546875, 5.1016845703125, 5.26959228515625, 5.4375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 16.0, 17.0, 43.0, 36.0, 54.0, 80.0, 88.0, 126.0, 152.0, 222.0, 372.0, 587.0, 1363.0, 3971.0, 19785.0, 187525.0, 3074949.0, 839735.0, 52480.0, 8132.0, 2172.0, 840.0, 455.0, 259.0, 195.0, 137.0, 141.0, 83.0, 63.0, 40.0, 36.0, 28.0, 24.0, 12.0, 11.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.5625, -25.63818359375, -24.7138671875, -23.78955078125, -22.865234375, -21.94091796875, -21.0166015625, -20.09228515625, -19.16796875, -18.24365234375, -17.3193359375, -16.39501953125, -15.470703125, -14.54638671875, -13.6220703125, -12.69775390625, -11.7734375, -10.84912109375, -9.9248046875, -9.00048828125, -8.076171875, -7.15185546875, -6.2275390625, -5.30322265625, -4.37890625, -3.45458984375, -2.5302734375, -1.60595703125, -0.681640625, 0.24267578125, 1.1669921875, 2.09130859375, 3.015625, 3.93994140625, 4.8642578125, 5.78857421875, 6.712890625, 7.63720703125, 8.5615234375, 9.48583984375, 10.41015625, 11.33447265625, 12.2587890625, 13.18310546875, 14.107421875, 15.03173828125, 15.9560546875, 16.88037109375, 17.8046875, 18.72900390625, 19.6533203125, 20.57763671875, 21.501953125, 22.42626953125, 23.3505859375, 24.27490234375, 25.19921875, 26.12353515625, 27.0478515625, 27.97216796875, 28.896484375, 29.82080078125, 30.7451171875, 31.66943359375, 32.59375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 10.0, 25.0, 40.0, 79.0, 172.0, 337.0, 559.0, 796.0, 814.0, 559.0, 328.0, 173.0, 87.0, 53.0, 21.0, 12.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.96875, -32.798828125, -31.62890625, -30.458984375, -29.2890625, -28.119140625, -26.94921875, -25.779296875, -24.609375, -23.439453125, -22.26953125, -21.099609375, -19.9296875, -18.759765625, -17.58984375, -16.419921875, -15.25, -14.080078125, -12.91015625, -11.740234375, -10.5703125, -9.400390625, -8.23046875, -7.060546875, -5.890625, -4.720703125, -3.55078125, -2.380859375, -1.2109375, -0.041015625, 1.12890625, 2.298828125, 3.46875, 4.638671875, 5.80859375, 6.978515625, 8.1484375, 9.318359375, 10.48828125, 11.658203125, 12.828125, 13.998046875, 15.16796875, 16.337890625, 17.5078125, 18.677734375, 19.84765625, 21.017578125, 22.1875, 23.357421875, 24.52734375, 25.697265625, 26.8671875, 28.037109375, 29.20703125, 30.376953125, 31.546875, 32.716796875, 33.88671875, 35.056640625, 36.2265625, 37.396484375, 38.56640625, 39.736328125, 40.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 0.0, 3.0, 6.0, 11.0, 26.0, 38.0, 81.0, 201.0, 567.0, 3088.0, 224214.0, 3934861.0, 28976.0, 1603.0, 361.0, 149.0, 52.0, 20.0, 12.0, 12.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.84375, -44.50244140625, -41.1611328125, -37.81982421875, -34.478515625, -31.13720703125, -27.7958984375, -24.45458984375, -21.11328125, -17.77197265625, -14.4306640625, -11.08935546875, -7.748046875, -4.40673828125, -1.0654296875, 2.27587890625, 5.6171875, 8.95849609375, 12.2998046875, 15.64111328125, 18.982421875, 22.32373046875, 25.6650390625, 29.00634765625, 32.34765625, 35.68896484375, 39.0302734375, 42.37158203125, 45.712890625, 49.05419921875, 52.3955078125, 55.73681640625, 59.078125, 62.41943359375, 65.7607421875, 69.10205078125, 72.443359375, 75.78466796875, 79.1259765625, 82.46728515625, 85.80859375, 89.14990234375, 92.4912109375, 95.83251953125, 99.173828125, 102.51513671875, 105.8564453125, 109.19775390625, 112.5390625, 115.88037109375, 119.2216796875, 122.56298828125, 125.904296875, 129.24560546875, 132.5869140625, 135.92822265625, 139.26953125, 142.61083984375, 145.9521484375, 149.29345703125, 152.634765625, 155.97607421875, 159.3173828125, 162.65869140625, 166.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 17.0, 289.0, 619.0, 86.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.49221801757812, -63.72492980957031, -48.957645416259766, -34.19036102294922, -19.423072814941406, -4.655784606933594, 10.111495971679688, 24.8787841796875, 39.64607238769531, 54.413360595703125, 69.18064880371094, 83.94792938232422, 98.71521759033203, 113.48250579833984, 128.24978637695312, 143.01707458496094, 157.78436279296875, 172.55165100097656, 187.31893920898438, 202.08621215820312, 216.853515625, 231.62078857421875, 246.38807678222656, 261.1553649902344, 275.92266845703125, 290.68994140625, 305.4572448730469, 320.2245178222656, 334.9918212890625, 349.75909423828125, 364.5263671875, 379.2936706542969, 394.0609130859375, 408.82818603515625, 423.5954895019531, 438.3627624511719, 453.13006591796875, 467.8973388671875, 482.66461181640625, 497.4319152832031, 512.19921875, 526.9664916992188, 541.7337646484375, 556.5010986328125, 571.2683715820312, 586.03564453125, 600.8029174804688, 615.5701904296875, 630.3375244140625, 645.1047973632812, 659.8720703125, 674.639404296875, 689.4066772460938, 704.1739501953125, 718.9412231445312, 733.70849609375, 748.4757690429688, 763.2430419921875, 778.0103149414062, 792.7776489257812, 807.544921875, 822.3121948242188, 837.0794677734375, 851.8468017578125, 866.6140747070312]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 8.0, 7.0, 4.0, 6.0, 14.0, 16.0, 21.0, 16.0, 17.0, 22.0, 23.0, 31.0, 33.0, 33.0, 36.0, 33.0, 40.0, 39.0, 43.0, 25.0, 43.0, 44.0, 33.0, 41.0, 39.0, 49.0, 28.0, 32.0, 27.0, 33.0, 25.0, 15.0, 19.0, 24.0, 16.0, 12.0, 10.0, 9.0, 3.0, 10.0, 2.0, 4.0, 3.0, 3.0, 6.0, 0.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-67.44198608398438, -65.38399505615234, -63.32600402832031, -61.26801681518555, -59.210025787353516, -57.152034759521484, -55.09404754638672, -53.03605651855469, -50.978065490722656, -48.920074462890625, -46.862083435058594, -44.80409622192383, -42.7461051940918, -40.688114166259766, -38.630126953125, -36.57213592529297, -34.51414489746094, -32.456153869628906, -30.398164749145508, -28.34017562866211, -26.282184600830078, -24.224193572998047, -22.16620445251465, -20.10821533203125, -18.05022430419922, -15.992234230041504, -13.934244155883789, -11.876254081726074, -9.81826400756836, -7.7602739334106445, -5.70228385925293, -3.644293785095215, -1.5863113403320312, 0.4716787338256836, 2.5296688079833984, 4.587658882141113, 6.645648956298828, 8.703639030456543, 10.761629104614258, 12.819619178771973, 14.877609252929688, 16.93560028076172, 18.993589401245117, 21.051578521728516, 23.109569549560547, 25.167560577392578, 27.225549697875977, 29.283538818359375, 31.341529846191406, 33.39952087402344, 35.45751190185547, 37.515499114990234, 39.573490142822266, 41.6314811706543, 43.68946838378906, 45.747459411621094, 47.805450439453125, 49.863441467285156, 51.92143249511719, 53.97941970825195, 56.037410736083984, 58.095401763916016, 60.15338897705078, 62.21138000488281, 64.26937103271484]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 6.0, 12.0, 8.0, 14.0, 9.0, 13.0, 15.0, 15.0, 16.0, 21.0, 22.0, 27.0, 41.0, 19.0, 30.0, 49.0, 36.0, 39.0, 44.0, 43.0, 37.0, 37.0, 40.0, 46.0, 38.0, 24.0, 30.0, 34.0, 28.0, 27.0, 23.0, 25.0, 21.0, 13.0, 12.0, 17.0, 18.0, 8.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.671875, -5.5020751953125, -5.332275390625, -5.1624755859375, -4.99267578125, -4.8228759765625, -4.653076171875, -4.4832763671875, -4.3134765625, -4.1436767578125, -3.973876953125, -3.8040771484375, -3.63427734375, -3.4644775390625, -3.294677734375, -3.1248779296875, -2.955078125, -2.7852783203125, -2.615478515625, -2.4456787109375, -2.27587890625, -2.1060791015625, -1.936279296875, -1.7664794921875, -1.5966796875, -1.4268798828125, -1.257080078125, -1.0872802734375, -0.91748046875, -0.7476806640625, -0.577880859375, -0.4080810546875, -0.23828125, -0.0684814453125, 0.101318359375, 0.2711181640625, 0.44091796875, 0.6107177734375, 0.780517578125, 0.9503173828125, 1.1201171875, 1.2899169921875, 1.459716796875, 1.6295166015625, 1.79931640625, 1.9691162109375, 2.138916015625, 2.3087158203125, 2.478515625, 2.6483154296875, 2.818115234375, 2.9879150390625, 3.15771484375, 3.3275146484375, 3.497314453125, 3.6671142578125, 3.8369140625, 4.0067138671875, 4.176513671875, 4.3463134765625, 4.51611328125, 4.6859130859375, 4.855712890625, 5.0255126953125, 5.1953125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 7.0, 16.0, 19.0, 32.0, 48.0, 97.0, 135.0, 208.0, 312.0, 460.0, 740.0, 1051.0, 1620.0, 2466.0, 3673.0, 5833.0, 9152.0, 14074.0, 22117.0, 35692.0, 58344.0, 93019.0, 139363.0, 178247.0, 163753.0, 116857.0, 75255.0, 46603.0, 28901.0, 18038.0, 11311.0, 7304.0, 4666.0, 3074.0, 2091.0, 1377.0, 889.0, 597.0, 384.0, 244.0, 188.0, 106.0, 67.0, 58.0, 27.0, 22.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.482177734375, -0.4678993225097656, -0.45362091064453125, -0.4393424987792969, -0.4250640869140625, -0.4107856750488281, -0.39650726318359375, -0.3822288513183594, -0.367950439453125, -0.3536720275878906, -0.33939361572265625, -0.3251152038574219, -0.3108367919921875, -0.2965583801269531, -0.28227996826171875, -0.2680015563964844, -0.25372314453125, -0.23944473266601562, -0.22516632080078125, -0.21088790893554688, -0.1966094970703125, -0.18233108520507812, -0.16805267333984375, -0.15377426147460938, -0.139495849609375, -0.12521743774414062, -0.11093902587890625, -0.09666061401367188, -0.0823822021484375, -0.06810379028320312, -0.05382537841796875, -0.039546966552734375, -0.0252685546875, -0.010990142822265625, 0.00328826904296875, 0.017566680908203125, 0.0318450927734375, 0.046123504638671875, 0.06040191650390625, 0.07468032836914062, 0.088958740234375, 0.10323715209960938, 0.11751556396484375, 0.13179397583007812, 0.1460723876953125, 0.16035079956054688, 0.17462921142578125, 0.18890762329101562, 0.20318603515625, 0.21746444702148438, 0.23174285888671875, 0.24602127075195312, 0.2602996826171875, 0.2745780944824219, 0.28885650634765625, 0.3031349182128906, 0.317413330078125, 0.3316917419433594, 0.34597015380859375, 0.3602485656738281, 0.3745269775390625, 0.3888053894042969, 0.40308380126953125, 0.4173622131347656, 0.431640625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 10.0, 15.0, 20.0, 24.0, 17.0, 22.0, 27.0, 25.0, 33.0, 37.0, 39.0, 37.0, 52.0, 47.0, 39.0, 39.0, 1062.0, 53.0, 36.0, 34.0, 32.0, 31.0, 30.0, 31.0, 29.0, 30.0, 18.0, 19.0, 29.0, 15.0, 17.0, 11.0, 9.0, 10.0, 7.0, 8.0, 6.0, 8.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.68359375, -3.5667724609375, -3.449951171875, -3.3331298828125, -3.21630859375, -3.0994873046875, -2.982666015625, -2.8658447265625, -2.7490234375, -2.6322021484375, -2.515380859375, -2.3985595703125, -2.28173828125, -2.1649169921875, -2.048095703125, -1.9312744140625, -1.814453125, -1.6976318359375, -1.580810546875, -1.4639892578125, -1.34716796875, -1.2303466796875, -1.113525390625, -0.9967041015625, -0.8798828125, -0.7630615234375, -0.646240234375, -0.5294189453125, -0.41259765625, -0.2957763671875, -0.178955078125, -0.0621337890625, 0.0546875, 0.1715087890625, 0.288330078125, 0.4051513671875, 0.52197265625, 0.6387939453125, 0.755615234375, 0.8724365234375, 0.9892578125, 1.1060791015625, 1.222900390625, 1.3397216796875, 1.45654296875, 1.5733642578125, 1.690185546875, 1.8070068359375, 1.923828125, 2.0406494140625, 2.157470703125, 2.2742919921875, 2.39111328125, 2.5079345703125, 2.624755859375, 2.7415771484375, 2.8583984375, 2.9752197265625, 3.092041015625, 3.2088623046875, 3.32568359375, 3.4425048828125, 3.559326171875, 3.6761474609375, 3.79296875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 11.0, 21.0, 29.0, 47.0, 68.0, 106.0, 142.0, 190.0, 294.0, 462.0, 649.0, 992.0, 1438.0, 2024.0, 3282.0, 4831.0, 7388.0, 11443.0, 17802.0, 27813.0, 42292.0, 63006.0, 92200.0, 124137.0, 1102220.0, 231806.0, 114915.0, 82857.0, 57197.0, 37912.0, 24475.0, 15659.0, 10151.0, 6425.0, 4278.0, 2831.0, 1853.0, 1235.0, 874.0, 546.0, 403.0, 285.0, 157.0, 113.0, 77.0, 59.0, 47.0, 20.0, 19.0, 16.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.28369140625, -0.27449798583984375, -0.2653045654296875, -0.25611114501953125, -0.246917724609375, -0.23772430419921875, -0.2285308837890625, -0.21933746337890625, -0.21014404296875, -0.20095062255859375, -0.1917572021484375, -0.18256378173828125, -0.173370361328125, -0.16417694091796875, -0.1549835205078125, -0.14579010009765625, -0.1365966796875, -0.12740325927734375, -0.1182098388671875, -0.10901641845703125, -0.099822998046875, -0.09062957763671875, -0.0814361572265625, -0.07224273681640625, -0.06304931640625, -0.05385589599609375, -0.0446624755859375, -0.03546905517578125, -0.026275634765625, -0.01708221435546875, -0.0078887939453125, 0.00130462646484375, 0.010498046875, 0.01969146728515625, 0.0288848876953125, 0.03807830810546875, 0.047271728515625, 0.05646514892578125, 0.0656585693359375, 0.07485198974609375, 0.08404541015625, 0.09323883056640625, 0.1024322509765625, 0.11162567138671875, 0.120819091796875, 0.13001251220703125, 0.1392059326171875, 0.14839935302734375, 0.1575927734375, 0.16678619384765625, 0.1759796142578125, 0.18517303466796875, 0.194366455078125, 0.20355987548828125, 0.2127532958984375, 0.22194671630859375, 0.23114013671875, 0.24033355712890625, 0.2495269775390625, 0.25872039794921875, 0.267913818359375, 0.27710723876953125, 0.2863006591796875, 0.29549407958984375, 0.3046875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 7.0, 13.0, 18.0, 22.0, 18.0, 26.0, 33.0, 56.0, 72.0, 95.0, 107.0, 97.0, 97.0, 73.0, 61.0, 49.0, 33.0, 29.0, 25.0, 8.0, 12.0, 6.0, 3.0, 10.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00888824462890625, -0.008611202239990234, -0.008334159851074219, -0.008057117462158203, -0.0077800750732421875, -0.007503032684326172, -0.007225990295410156, -0.006948947906494141, -0.006671905517578125, -0.006394863128662109, -0.006117820739746094, -0.005840778350830078, -0.0055637359619140625, -0.005286693572998047, -0.005009651184082031, -0.004732608795166016, -0.00445556640625, -0.004178524017333984, -0.0039014816284179688, -0.003624439239501953, -0.0033473968505859375, -0.003070354461669922, -0.0027933120727539062, -0.0025162696838378906, -0.002239227294921875, -0.0019621849060058594, -0.0016851425170898438, -0.0014081001281738281, -0.0011310577392578125, -0.0008540153503417969, -0.0005769729614257812, -0.0002999305725097656, -2.288818359375e-05, 0.0002541542053222656, 0.0005311965942382812, 0.0008082389831542969, 0.0010852813720703125, 0.0013623237609863281, 0.0016393661499023438, 0.0019164085388183594, 0.002193450927734375, 0.0024704933166503906, 0.0027475357055664062, 0.003024578094482422, 0.0033016204833984375, 0.003578662872314453, 0.0038557052612304688, 0.004132747650146484, 0.0044097900390625, 0.004686832427978516, 0.004963874816894531, 0.005240917205810547, 0.0055179595947265625, 0.005795001983642578, 0.006072044372558594, 0.006349086761474609, 0.006626129150390625, 0.006903171539306641, 0.007180213928222656, 0.007457256317138672, 0.0077342987060546875, 0.008011341094970703, 0.008288383483886719, 0.008565425872802734, 0.00884246826171875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 5.0, 10.0, 10.0, 13.0, 21.0, 26.0, 39.0, 65.0, 88.0, 103.0, 164.0, 251.0, 572.0, 12647.0, 1029633.0, 3703.0, 472.0, 214.0, 141.0, 97.0, 74.0, 57.0, 42.0, 34.0, 22.0, 10.0, 15.0, 8.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1651611328125, -0.1600627899169922, -0.15496444702148438, -0.14986610412597656, -0.14476776123046875, -0.13966941833496094, -0.13457107543945312, -0.1294727325439453, -0.1243743896484375, -0.11927604675292969, -0.11417770385742188, -0.10907936096191406, -0.10398101806640625, -0.09888267517089844, -0.09378433227539062, -0.08868598937988281, -0.083587646484375, -0.07848930358886719, -0.07339096069335938, -0.06829261779785156, -0.06319427490234375, -0.05809593200683594, -0.052997589111328125, -0.04789924621582031, -0.0428009033203125, -0.03770256042480469, -0.032604217529296875, -0.027505874633789062, -0.02240753173828125, -0.017309188842773438, -0.012210845947265625, -0.0071125030517578125, -0.00201416015625, 0.0030841827392578125, 0.008182525634765625, 0.013280868530273438, 0.01837921142578125, 0.023477554321289062, 0.028575897216796875, 0.03367424011230469, 0.0387725830078125, 0.04387092590332031, 0.048969268798828125, 0.05406761169433594, 0.05916595458984375, 0.06426429748535156, 0.06936264038085938, 0.07446098327636719, 0.079559326171875, 0.08465766906738281, 0.08975601196289062, 0.09485435485839844, 0.09995269775390625, 0.10505104064941406, 0.11014938354492188, 0.11524772644042969, 0.1203460693359375, 0.1254444122314453, 0.13054275512695312, 0.13564109802246094, 0.14073944091796875, 0.14583778381347656, 0.15093612670898438, 0.1560344696044922, 0.1611328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 9.0, 57.0, 365.0, 455.0, 116.0, 14.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005142928101122379, -0.004581226501613855, -0.004019524902105331, -0.00345782283693552, -0.0028961212374269962, -0.0023344196379184723, -0.0017727178055793047, -0.001211015973240137, -0.0006493143737316132, -8.761265780776739e-05, 0.0004740890581160784, 0.0010357907740399241, 0.00159749248996377, 0.002159194089472294, 0.0027208959218114614, 0.003282597754150629, 0.003844299353659153, 0.004406000953167677, 0.004967702552676201, 0.005529404617846012, 0.006091106217354536, 0.00665280781686306, 0.007214509882032871, 0.007776211481541395, 0.008337913081049919, 0.00889961514621973, 0.009461316280066967, 0.010023018345236778, 0.010584719479084015, 0.011146421544253826, 0.011708123609423637, 0.012269824743270874, 0.01283152587711811, 0.013393227942287922, 0.013954929076135159, 0.01451663114130497, 0.015078332275152206, 0.015640035271644592, 0.01620173640549183, 0.016763437539339066, 0.01732514053583145, 0.017886841669678688, 0.018448544666171074, 0.01901024580001831, 0.019571946933865547, 0.020133648067712784, 0.02069535106420517, 0.021257052198052406, 0.021818753331899643, 0.02238045446574688, 0.022942157462239265, 0.023503858596086502, 0.02406555972993374, 0.024627260863780975, 0.02518896386027336, 0.025750664994120598, 0.026312366127967834, 0.02687406726181507, 0.027435770258307457, 0.027997471392154694, 0.02855917252600193, 0.029120873659849167, 0.029682576656341553, 0.03024427779018879, 0.030805980786681175]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 11.0, 10.0, 15.0, 18.0, 10.0, 18.0, 18.0, 23.0, 22.0, 30.0, 25.0, 30.0, 31.0, 37.0, 27.0, 36.0, 33.0, 36.0, 46.0, 44.0, 51.0, 35.0, 44.0, 31.0, 38.0, 23.0, 27.0, 33.0, 31.0, 16.0, 17.0, 21.0, 18.0, 16.0, 17.0, 11.0, 16.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032578706741333008, -0.0031544817611575127, -0.0030510928481817245, -0.0029477039352059364, -0.0028443150222301483, -0.00274092610925436, -0.002637537196278572, -0.002534148283302784, -0.002430759370326996, -0.0023273704573512077, -0.0022239815443754196, -0.0021205926313996315, -0.0020172037184238434, -0.0019138148054480553, -0.0018104258924722672, -0.001707036979496479, -0.001603648066520691, -0.0015002591535449028, -0.0013968702405691147, -0.0012934813275933266, -0.0011900924146175385, -0.0010867035016417503, -0.0009833145886659622, -0.0008799256756901741, -0.000776536762714386, -0.0006731478497385979, -0.0005697589367628098, -0.00046637002378702164, -0.0003629811108112335, -0.0002595921978354454, -0.0001562032848596573, -5.281437188386917e-05, 5.0574541091918945e-05, 0.00015396345406770706, 0.0002573523670434952, 0.0003607412800192833, 0.0004641301929950714, 0.0005675191059708595, 0.0006709080189466476, 0.0007742969319224358, 0.0008776858448982239, 0.000981074757874012, 0.0010844636708498001, 0.0011878525838255882, 0.0012912414968013763, 0.0013946304097771645, 0.0014980193227529526, 0.0016014082357287407, 0.0017047971487045288, 0.001808186061680317, 0.001911574974656105, 0.002014963887631893, 0.0021183528006076813, 0.0022217417135834694, 0.0023251306265592575, 0.0024285195395350456, 0.0025319084525108337, 0.002635297365486622, 0.00273868627846241, 0.002842075191438198, 0.002945464104413986, 0.0030488530173897743, 0.0031522419303655624, 0.0032556308433413506, 0.0033590197563171387]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 6.0, 12.0, 8.0, 14.0, 9.0, 13.0, 15.0, 15.0, 16.0, 21.0, 22.0, 27.0, 41.0, 19.0, 30.0, 49.0, 36.0, 39.0, 44.0, 43.0, 37.0, 37.0, 40.0, 46.0, 38.0, 25.0, 29.0, 34.0, 28.0, 27.0, 23.0, 25.0, 21.0, 13.0, 12.0, 17.0, 18.0, 8.0, 12.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.671875, -5.5020751953125, -5.332275390625, -5.1624755859375, -4.99267578125, -4.8228759765625, -4.653076171875, -4.4832763671875, -4.3134765625, -4.1436767578125, -3.973876953125, -3.8040771484375, -3.63427734375, -3.4644775390625, -3.294677734375, -3.1248779296875, -2.955078125, -2.7852783203125, -2.615478515625, -2.4456787109375, -2.27587890625, -2.1060791015625, -1.936279296875, -1.7664794921875, -1.5966796875, -1.4268798828125, -1.257080078125, -1.0872802734375, -0.91748046875, -0.7476806640625, -0.577880859375, -0.4080810546875, -0.23828125, -0.0684814453125, 0.101318359375, 0.2711181640625, 0.44091796875, 0.6107177734375, 0.780517578125, 0.9503173828125, 1.1201171875, 1.2899169921875, 1.459716796875, 1.6295166015625, 1.79931640625, 1.9691162109375, 2.138916015625, 2.3087158203125, 2.478515625, 2.6483154296875, 2.818115234375, 2.9879150390625, 3.15771484375, 3.3275146484375, 3.497314453125, 3.6671142578125, 3.8369140625, 4.0067138671875, 4.176513671875, 4.3463134765625, 4.51611328125, 4.6859130859375, 4.855712890625, 5.0255126953125, 5.1953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 11.0, 11.0, 14.0, 28.0, 24.0, 47.0, 52.0, 80.0, 109.0, 153.0, 186.0, 320.0, 501.0, 747.0, 1278.0, 2504.0, 4817.0, 10963.0, 28373.0, 83692.0, 273925.0, 418463.0, 144343.0, 46238.0, 16974.0, 6953.0, 3279.0, 1630.0, 957.0, 616.0, 379.0, 271.0, 148.0, 122.0, 103.0, 64.0, 54.0, 37.0, 34.0, 12.0, 9.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.90625, -5.728515625, -5.55078125, -5.373046875, -5.1953125, -5.017578125, -4.83984375, -4.662109375, -4.484375, -4.306640625, -4.12890625, -3.951171875, -3.7734375, -3.595703125, -3.41796875, -3.240234375, -3.0625, -2.884765625, -2.70703125, -2.529296875, -2.3515625, -2.173828125, -1.99609375, -1.818359375, -1.640625, -1.462890625, -1.28515625, -1.107421875, -0.9296875, -0.751953125, -0.57421875, -0.396484375, -0.21875, -0.041015625, 0.13671875, 0.314453125, 0.4921875, 0.669921875, 0.84765625, 1.025390625, 1.203125, 1.380859375, 1.55859375, 1.736328125, 1.9140625, 2.091796875, 2.26953125, 2.447265625, 2.625, 2.802734375, 2.98046875, 3.158203125, 3.3359375, 3.513671875, 3.69140625, 3.869140625, 4.046875, 4.224609375, 4.40234375, 4.580078125, 4.7578125, 4.935546875, 5.11328125, 5.291015625, 5.46875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 6.0, 16.0, 12.0, 14.0, 12.0, 22.0, 19.0, 28.0, 36.0, 28.0, 38.0, 44.0, 31.0, 46.0, 51.0, 94.0, 323.0, 1578.0, 146.0, 68.0, 43.0, 36.0, 31.0, 43.0, 36.0, 30.0, 27.0, 28.0, 19.0, 17.0, 21.0, 14.0, 14.0, 12.0, 11.0, 6.0, 5.0, 8.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-20.8125, -20.203857421875, -19.59521484375, -18.986572265625, -18.3779296875, -17.769287109375, -17.16064453125, -16.552001953125, -15.943359375, -15.334716796875, -14.72607421875, -14.117431640625, -13.5087890625, -12.900146484375, -12.29150390625, -11.682861328125, -11.07421875, -10.465576171875, -9.85693359375, -9.248291015625, -8.6396484375, -8.031005859375, -7.42236328125, -6.813720703125, -6.205078125, -5.596435546875, -4.98779296875, -4.379150390625, -3.7705078125, -3.161865234375, -2.55322265625, -1.944580078125, -1.3359375, -0.727294921875, -0.11865234375, 0.489990234375, 1.0986328125, 1.707275390625, 2.31591796875, 2.924560546875, 3.533203125, 4.141845703125, 4.75048828125, 5.359130859375, 5.9677734375, 6.576416015625, 7.18505859375, 7.793701171875, 8.40234375, 9.010986328125, 9.61962890625, 10.228271484375, 10.8369140625, 11.445556640625, 12.05419921875, 12.662841796875, 13.271484375, 13.880126953125, 14.48876953125, 15.097412109375, 15.7060546875, 16.314697265625, 16.92333984375, 17.531982421875, 18.140625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 5.0, 8.0, 8.0, 8.0, 6.0, 14.0, 16.0, 17.0, 17.0, 23.0, 25.0, 34.0, 36.0, 39.0, 68.0, 75.0, 133.0, 232.0, 519.0, 1568.0, 15674.0, 3065634.0, 57782.0, 2382.0, 613.0, 252.0, 122.0, 89.0, 47.0, 45.0, 37.0, 31.0, 32.0, 18.0, 14.0, 16.0, 17.0, 11.0, 8.0, 3.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.34375, -37.00439453125, -35.6650390625, -34.32568359375, -32.986328125, -31.64697265625, -30.3076171875, -28.96826171875, -27.62890625, -26.28955078125, -24.9501953125, -23.61083984375, -22.271484375, -20.93212890625, -19.5927734375, -18.25341796875, -16.9140625, -15.57470703125, -14.2353515625, -12.89599609375, -11.556640625, -10.21728515625, -8.8779296875, -7.53857421875, -6.19921875, -4.85986328125, -3.5205078125, -2.18115234375, -0.841796875, 0.49755859375, 1.8369140625, 3.17626953125, 4.515625, 5.85498046875, 7.1943359375, 8.53369140625, 9.873046875, 11.21240234375, 12.5517578125, 13.89111328125, 15.23046875, 16.56982421875, 17.9091796875, 19.24853515625, 20.587890625, 21.92724609375, 23.2666015625, 24.60595703125, 25.9453125, 27.28466796875, 28.6240234375, 29.96337890625, 31.302734375, 32.64208984375, 33.9814453125, 35.32080078125, 36.66015625, 37.99951171875, 39.3388671875, 40.67822265625, 42.017578125, 43.35693359375, 44.6962890625, 46.03564453125, 47.375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [120.0, 896.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.795110702514648, -2.379739761352539, 8.03563117980957, 18.45100212097168, 28.86637306213379, 39.28174591064453, 49.697113037109375, 60.11248016357422, 70.5278549194336, 80.94322204589844, 91.35859680175781, 101.77397155761719, 112.18933868408203, 122.60470581054688, 133.02008056640625, 143.43545532226562, 153.850830078125, 164.26620483398438, 174.68157958984375, 185.09693908691406, 195.51231384277344, 205.9276885986328, 216.34304809570312, 226.7584228515625, 237.17379760742188, 247.58917236328125, 258.0045471191406, 268.419921875, 278.83526611328125, 289.2506408691406, 299.666015625, 310.0813903808594, 320.49676513671875, 330.9121398925781, 341.3275146484375, 351.7428894042969, 362.15826416015625, 372.5736083984375, 382.9889831542969, 393.40435791015625, 403.8197326660156, 414.235107421875, 424.6504821777344, 435.06585693359375, 445.481201171875, 455.8965759277344, 466.31195068359375, 476.7273254394531, 487.1427001953125, 497.5580749511719, 507.97344970703125, 518.3887939453125, 528.80419921875, 539.2195434570312, 549.6349487304688, 560.05029296875, 570.4656982421875, 580.8810424804688, 591.2964477539062, 601.7117919921875, 612.127197265625, 622.5425415039062, 632.9579467773438, 643.373291015625, 653.7886352539062]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 11.0, 12.0, 9.0, 18.0, 13.0, 21.0, 22.0, 25.0, 23.0, 30.0, 30.0, 19.0, 24.0, 30.0, 36.0, 36.0, 36.0, 34.0, 48.0, 36.0, 43.0, 33.0, 39.0, 24.0, 33.0, 31.0, 35.0, 31.0, 27.0, 18.0, 19.0, 18.0, 20.0, 12.0, 14.0, 10.0, 12.0, 8.0, 7.0, 7.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.83184051513672, -56.977657318115234, -55.12347412109375, -53.269290924072266, -51.41510772705078, -49.5609245300293, -47.70674133300781, -45.85255813598633, -43.998374938964844, -42.14419174194336, -40.290008544921875, -38.43582534790039, -36.581642150878906, -34.72745895385742, -32.87327575683594, -31.019092559814453, -29.16490936279297, -27.310726165771484, -25.45654296875, -23.602359771728516, -21.74817657470703, -19.893993377685547, -18.039810180664062, -16.185626983642578, -14.331443786621094, -12.47726058959961, -10.623077392578125, -8.76889419555664, -6.914710998535156, -5.060527801513672, -3.2063446044921875, -1.3521614074707031, 0.5020217895507812, 2.3562049865722656, 4.21038818359375, 6.064571380615234, 7.918754577636719, 9.772937774658203, 11.627120971679688, 13.481304168701172, 15.335487365722656, 17.18967056274414, 19.043853759765625, 20.89803695678711, 22.752220153808594, 24.606403350830078, 26.460586547851562, 28.314769744873047, 30.16895294189453, 32.023136138916016, 33.8773193359375, 35.731502532958984, 37.58568572998047, 39.43986892700195, 41.29405212402344, 43.14823532104492, 45.002418518066406, 46.85660171508789, 48.710784912109375, 50.56496810913086, 52.419151306152344, 54.27333450317383, 56.12751770019531, 57.9817008972168, 59.83588409423828]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 13.0, 6.0, 11.0, 11.0, 16.0, 15.0, 18.0, 15.0, 17.0, 24.0, 30.0, 29.0, 28.0, 38.0, 35.0, 43.0, 33.0, 54.0, 33.0, 41.0, 33.0, 38.0, 52.0, 31.0, 26.0, 38.0, 28.0, 29.0, 24.0, 23.0, 26.0, 22.0, 10.0, 11.0, 18.0, 18.0, 8.0, 5.0, 12.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-5.734375, -5.5615234375, -5.388671875, -5.2158203125, -5.04296875, -4.8701171875, -4.697265625, -4.5244140625, -4.3515625, -4.1787109375, -4.005859375, -3.8330078125, -3.66015625, -3.4873046875, -3.314453125, -3.1416015625, -2.96875, -2.7958984375, -2.623046875, -2.4501953125, -2.27734375, -2.1044921875, -1.931640625, -1.7587890625, -1.5859375, -1.4130859375, -1.240234375, -1.0673828125, -0.89453125, -0.7216796875, -0.548828125, -0.3759765625, -0.203125, -0.0302734375, 0.142578125, 0.3154296875, 0.48828125, 0.6611328125, 0.833984375, 1.0068359375, 1.1796875, 1.3525390625, 1.525390625, 1.6982421875, 1.87109375, 2.0439453125, 2.216796875, 2.3896484375, 2.5625, 2.7353515625, 2.908203125, 3.0810546875, 3.25390625, 3.4267578125, 3.599609375, 3.7724609375, 3.9453125, 4.1181640625, 4.291015625, 4.4638671875, 4.63671875, 4.8095703125, 4.982421875, 5.1552734375, 5.328125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 6.0, 10.0, 11.0, 11.0, 19.0, 24.0, 29.0, 26.0, 35.0, 39.0, 45.0, 62.0, 77.0, 112.0, 183.0, 384.0, 1013.0, 4329.0, 29695.0, 364511.0, 3191695.0, 554636.0, 39774.0, 5269.0, 1112.0, 408.0, 191.0, 136.0, 86.0, 54.0, 54.0, 52.0, 42.0, 26.0, 25.0, 25.0, 15.0, 9.0, 13.0, 11.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-23.921875, -23.1640625, -22.40625, -21.6484375, -20.890625, -20.1328125, -19.375, -18.6171875, -17.859375, -17.1015625, -16.34375, -15.5859375, -14.828125, -14.0703125, -13.3125, -12.5546875, -11.796875, -11.0390625, -10.28125, -9.5234375, -8.765625, -8.0078125, -7.25, -6.4921875, -5.734375, -4.9765625, -4.21875, -3.4609375, -2.703125, -1.9453125, -1.1875, -0.4296875, 0.328125, 1.0859375, 1.84375, 2.6015625, 3.359375, 4.1171875, 4.875, 5.6328125, 6.390625, 7.1484375, 7.90625, 8.6640625, 9.421875, 10.1796875, 10.9375, 11.6953125, 12.453125, 13.2109375, 13.96875, 14.7265625, 15.484375, 16.2421875, 17.0, 17.7578125, 18.515625, 19.2734375, 20.03125, 20.7890625, 21.546875, 22.3046875, 23.0625, 23.8203125, 24.578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 9.0, 15.0, 20.0, 42.0, 49.0, 80.0, 114.0, 184.0, 257.0, 333.0, 450.0, 519.0, 534.0, 406.0, 362.0, 245.0, 138.0, 109.0, 78.0, 42.0, 28.0, 26.0, 13.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.189208984375, -26.47216796875, -25.755126953125, -25.0380859375, -24.321044921875, -23.60400390625, -22.886962890625, -22.169921875, -21.452880859375, -20.73583984375, -20.018798828125, -19.3017578125, -18.584716796875, -17.86767578125, -17.150634765625, -16.43359375, -15.716552734375, -14.99951171875, -14.282470703125, -13.5654296875, -12.848388671875, -12.13134765625, -11.414306640625, -10.697265625, -9.980224609375, -9.26318359375, -8.546142578125, -7.8291015625, -7.112060546875, -6.39501953125, -5.677978515625, -4.9609375, -4.243896484375, -3.52685546875, -2.809814453125, -2.0927734375, -1.375732421875, -0.65869140625, 0.058349609375, 0.775390625, 1.492431640625, 2.20947265625, 2.926513671875, 3.6435546875, 4.360595703125, 5.07763671875, 5.794677734375, 6.51171875, 7.228759765625, 7.94580078125, 8.662841796875, 9.3798828125, 10.096923828125, 10.81396484375, 11.531005859375, 12.248046875, 12.965087890625, 13.68212890625, 14.399169921875, 15.1162109375, 15.833251953125, 16.55029296875, 17.267333984375, 17.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 19.0, 17.0, 39.0, 44.0, 91.0, 162.0, 278.0, 571.0, 1411.0, 4387.0, 21461.0, 173196.0, 2141329.0, 1690668.0, 136287.0, 18007.0, 3877.0, 1271.0, 526.0, 259.0, 161.0, 81.0, 50.0, 34.0, 17.0, 12.0, 5.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.25, -26.0625, -24.875, -23.6875, -22.5, -21.3125, -20.125, -18.9375, -17.75, -16.5625, -15.375, -14.1875, -13.0, -11.8125, -10.625, -9.4375, -8.25, -7.0625, -5.875, -4.6875, -3.5, -2.3125, -1.125, 0.0625, 1.25, 2.4375, 3.625, 4.8125, 6.0, 7.1875, 8.375, 9.5625, 10.75, 11.9375, 13.125, 14.3125, 15.5, 16.6875, 17.875, 19.0625, 20.25, 21.4375, 22.625, 23.8125, 25.0, 26.1875, 27.375, 28.5625, 29.75, 30.9375, 32.125, 33.3125, 34.5, 35.6875, 36.875, 38.0625, 39.25, 40.4375, 41.625, 42.8125, 44.0, 45.1875, 46.375, 47.5625, 48.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 14.0, 28.0, 51.0, 102.0, 158.0, 204.0, 174.0, 134.0, 84.0, 43.0, 11.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.90666961669922, -59.23860168457031, -54.57053756713867, -49.90247344970703, -45.234405517578125, -40.56633758544922, -35.89827346801758, -31.230209350585938, -26.56214141845703, -21.894075393676758, -17.226009368896484, -12.557943344116211, -7.8898773193359375, -3.221811294555664, 1.4462547302246094, 6.11431884765625, 10.782386779785156, 15.45045280456543, 20.118518829345703, 24.786584854125977, 29.45465087890625, 34.122718811035156, 38.7907829284668, 43.45884704589844, 48.126914978027344, 52.79498291015625, 57.46304702758789, 62.13111114501953, 66.79917907714844, 71.46724700927734, 76.13531494140625, 80.80337524414062, 85.47145080566406, 90.13951873779297, 94.80758666992188, 99.47564697265625, 104.14371490478516, 108.81178283691406, 113.47984313964844, 118.14791107177734, 122.81597900390625, 127.48404693603516, 132.15211486816406, 136.82017517089844, 141.48825073242188, 146.15631103515625, 150.82437133789062, 155.492431640625, 160.16050720214844, 164.8285675048828, 169.49664306640625, 174.16470336914062, 178.832763671875, 183.50083923339844, 188.1688995361328, 192.83697509765625, 197.50503540039062, 202.173095703125, 206.84117126464844, 211.5092315673828, 216.17730712890625, 220.84536743164062, 225.513427734375, 230.18148803710938, 234.8495635986328]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 14.0, 8.0, 6.0, 11.0, 13.0, 19.0, 13.0, 21.0, 28.0, 24.0, 23.0, 26.0, 29.0, 37.0, 45.0, 35.0, 38.0, 38.0, 27.0, 42.0, 53.0, 34.0, 47.0, 29.0, 24.0, 41.0, 36.0, 33.0, 26.0, 25.0, 25.0, 16.0, 19.0, 13.0, 14.0, 9.0, 10.0, 7.0, 11.0, 11.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.54420471191406, -46.789825439453125, -45.03544998168945, -43.281070709228516, -41.526695251464844, -39.772315979003906, -38.01793670654297, -36.2635612487793, -34.509185791015625, -32.75480651855469, -31.000431060791016, -29.246051788330078, -27.491676330566406, -25.73729705810547, -23.982919692993164, -22.22854232788086, -20.474163055419922, -18.719785690307617, -16.965408325195312, -15.211030006408691, -13.456652641296387, -11.702275276184082, -9.947896957397461, -8.193519592285156, -6.439142227172852, -4.684764862060547, -2.930387020111084, -1.176009178161621, 0.5783681869506836, 2.3327455520629883, 4.087123870849609, 5.841501235961914, 7.595878601074219, 9.350255966186523, 11.104633331298828, 12.85901165008545, 14.613389015197754, 16.367767333984375, 18.12214469909668, 19.876522064208984, 21.63089942932129, 23.385276794433594, 25.1396541595459, 26.894031524658203, 28.64841079711914, 30.402786254882812, 32.15716552734375, 33.91154479980469, 35.66592025756836, 37.4202995300293, 39.17467498779297, 40.929054260253906, 42.68342971801758, 44.437808990478516, 46.19218444824219, 47.946563720703125, 49.70094299316406, 51.455322265625, 53.20969772338867, 54.96407699584961, 56.71845245361328, 58.47283172607422, 60.227210998535156, 61.98158645629883, 63.7359619140625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 12.0, 7.0, 10.0, 14.0, 17.0, 17.0, 13.0, 15.0, 25.0, 26.0, 33.0, 27.0, 40.0, 32.0, 41.0, 37.0, 34.0, 36.0, 37.0, 45.0, 43.0, 33.0, 33.0, 47.0, 42.0, 34.0, 25.0, 25.0, 21.0, 23.0, 23.0, 24.0, 12.0, 15.0, 10.0, 8.0, 12.0, 8.0, 8.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-6.20703125, -6.02313232421875, -5.8392333984375, -5.65533447265625, -5.471435546875, -5.28753662109375, -5.1036376953125, -4.91973876953125, -4.73583984375, -4.55194091796875, -4.3680419921875, -4.18414306640625, -4.000244140625, -3.81634521484375, -3.6324462890625, -3.44854736328125, -3.2646484375, -3.08074951171875, -2.8968505859375, -2.71295166015625, -2.529052734375, -2.34515380859375, -2.1612548828125, -1.97735595703125, -1.79345703125, -1.60955810546875, -1.4256591796875, -1.24176025390625, -1.057861328125, -0.87396240234375, -0.6900634765625, -0.50616455078125, -0.322265625, -0.13836669921875, 0.0455322265625, 0.22943115234375, 0.413330078125, 0.59722900390625, 0.7811279296875, 0.96502685546875, 1.14892578125, 1.33282470703125, 1.5167236328125, 1.70062255859375, 1.884521484375, 2.06842041015625, 2.2523193359375, 2.43621826171875, 2.6201171875, 2.80401611328125, 2.9879150390625, 3.17181396484375, 3.355712890625, 3.53961181640625, 3.7235107421875, 3.90740966796875, 4.09130859375, 4.27520751953125, 4.4591064453125, 4.64300537109375, 4.826904296875, 5.01080322265625, 5.1947021484375, 5.37860107421875, 5.5625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 11.0, 9.0, 30.0, 33.0, 59.0, 66.0, 131.0, 193.0, 291.0, 472.0, 707.0, 1113.0, 1654.0, 2678.0, 4171.0, 6625.0, 10367.0, 16470.0, 26652.0, 43215.0, 69997.0, 112461.0, 163952.0, 188763.0, 145788.0, 96375.0, 59243.0, 36256.0, 22502.0, 13937.0, 8909.0, 5588.0, 3496.0, 2237.0, 1445.0, 926.0, 596.0, 438.0, 244.0, 162.0, 97.0, 62.0, 50.0, 32.0, 20.0, 13.0, 8.0, 9.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.49588775634765625, -0.4800567626953125, -0.46422576904296875, -0.448394775390625, -0.43256378173828125, -0.4167327880859375, -0.40090179443359375, -0.38507080078125, -0.36923980712890625, -0.3534088134765625, -0.33757781982421875, -0.321746826171875, -0.30591583251953125, -0.2900848388671875, -0.27425384521484375, -0.2584228515625, -0.24259185791015625, -0.2267608642578125, -0.21092987060546875, -0.195098876953125, -0.17926788330078125, -0.1634368896484375, -0.14760589599609375, -0.13177490234375, -0.11594390869140625, -0.1001129150390625, -0.08428192138671875, -0.068450927734375, -0.05261993408203125, -0.0367889404296875, -0.02095794677734375, -0.005126953125, 0.01070404052734375, 0.0265350341796875, 0.04236602783203125, 0.058197021484375, 0.07402801513671875, 0.0898590087890625, 0.10569000244140625, 0.12152099609375, 0.13735198974609375, 0.1531829833984375, 0.16901397705078125, 0.184844970703125, 0.20067596435546875, 0.2165069580078125, 0.23233795166015625, 0.2481689453125, 0.26399993896484375, 0.2798309326171875, 0.29566192626953125, 0.311492919921875, 0.32732391357421875, 0.3431549072265625, 0.35898590087890625, 0.37481689453125, 0.39064788818359375, 0.4064788818359375, 0.42230987548828125, 0.438140869140625, 0.45397186279296875, 0.4698028564453125, 0.48563385009765625, 0.50146484375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 7.0, 7.0, 16.0, 15.0, 11.0, 22.0, 27.0, 20.0, 31.0, 29.0, 28.0, 30.0, 50.0, 57.0, 62.0, 47.0, 1084.0, 48.0, 47.0, 41.0, 41.0, 33.0, 39.0, 37.0, 29.0, 28.0, 28.0, 24.0, 18.0, 18.0, 13.0, 13.0, 3.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.13720703125, -4.9892578125, -4.84130859375, -4.693359375, -4.54541015625, -4.3974609375, -4.24951171875, -4.1015625, -3.95361328125, -3.8056640625, -3.65771484375, -3.509765625, -3.36181640625, -3.2138671875, -3.06591796875, -2.91796875, -2.77001953125, -2.6220703125, -2.47412109375, -2.326171875, -2.17822265625, -2.0302734375, -1.88232421875, -1.734375, -1.58642578125, -1.4384765625, -1.29052734375, -1.142578125, -0.99462890625, -0.8466796875, -0.69873046875, -0.55078125, -0.40283203125, -0.2548828125, -0.10693359375, 0.041015625, 0.18896484375, 0.3369140625, 0.48486328125, 0.6328125, 0.78076171875, 0.9287109375, 1.07666015625, 1.224609375, 1.37255859375, 1.5205078125, 1.66845703125, 1.81640625, 1.96435546875, 2.1123046875, 2.26025390625, 2.408203125, 2.55615234375, 2.7041015625, 2.85205078125, 3.0, 3.14794921875, 3.2958984375, 3.44384765625, 3.591796875, 3.73974609375, 3.8876953125, 4.03564453125, 4.18359375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 17.0, 20.0, 24.0, 40.0, 48.0, 85.0, 152.0, 210.0, 333.0, 495.0, 700.0, 1085.0, 1739.0, 2683.0, 4066.0, 6310.0, 9898.0, 15497.0, 23909.0, 36335.0, 54736.0, 79793.0, 111444.0, 164329.0, 1166204.0, 126609.0, 95001.0, 66759.0, 44392.0, 29457.0, 19282.0, 12450.0, 8052.0, 5173.0, 3382.0, 2260.0, 1463.0, 931.0, 594.0, 435.0, 247.0, 173.0, 124.0, 70.0, 45.0, 30.0, 18.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.30859375, -0.2990264892578125, -0.289459228515625, -0.2798919677734375, -0.27032470703125, -0.2607574462890625, -0.251190185546875, -0.2416229248046875, -0.2320556640625, -0.2224884033203125, -0.212921142578125, -0.2033538818359375, -0.19378662109375, -0.1842193603515625, -0.174652099609375, -0.1650848388671875, -0.155517578125, -0.1459503173828125, -0.136383056640625, -0.1268157958984375, -0.11724853515625, -0.1076812744140625, -0.098114013671875, -0.0885467529296875, -0.0789794921875, -0.0694122314453125, -0.059844970703125, -0.0502777099609375, -0.04071044921875, -0.0311431884765625, -0.021575927734375, -0.0120086669921875, -0.00244140625, 0.0071258544921875, 0.016693115234375, 0.0262603759765625, 0.03582763671875, 0.0453948974609375, 0.054962158203125, 0.0645294189453125, 0.0740966796875, 0.0836639404296875, 0.093231201171875, 0.1027984619140625, 0.11236572265625, 0.1219329833984375, 0.131500244140625, 0.1410675048828125, 0.150634765625, 0.1602020263671875, 0.169769287109375, 0.1793365478515625, 0.18890380859375, 0.1984710693359375, 0.208038330078125, 0.2176055908203125, 0.2271728515625, 0.2367401123046875, 0.246307373046875, 0.2558746337890625, 0.26544189453125, 0.2750091552734375, 0.284576416015625, 0.2941436767578125, 0.3037109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 4.0, 9.0, 4.0, 6.0, 8.0, 13.0, 19.0, 18.0, 19.0, 20.0, 31.0, 32.0, 36.0, 44.0, 54.0, 52.0, 51.0, 50.0, 71.0, 70.0, 44.0, 56.0, 45.0, 38.0, 37.0, 23.0, 23.0, 23.0, 17.0, 12.0, 9.0, 7.0, 10.0, 7.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.006557464599609375, -0.006365478038787842, -0.006173491477966309, -0.005981504917144775, -0.005789518356323242, -0.005597531795501709, -0.005405545234680176, -0.005213558673858643, -0.005021572113037109, -0.004829585552215576, -0.004637598991394043, -0.00444561243057251, -0.0042536258697509766, -0.004061639308929443, -0.00386965274810791, -0.003677666187286377, -0.0034856796264648438, -0.0032936930656433105, -0.0031017065048217773, -0.002909719944000244, -0.002717733383178711, -0.0025257468223571777, -0.0023337602615356445, -0.0021417737007141113, -0.0019497871398925781, -0.001757800579071045, -0.0015658140182495117, -0.0013738274574279785, -0.0011818408966064453, -0.0009898543357849121, -0.0007978677749633789, -0.0006058812141418457, -0.0004138946533203125, -0.0002219080924987793, -2.9921531677246094e-05, 0.0001620650291442871, 0.0003540515899658203, 0.0005460381507873535, 0.0007380247116088867, 0.0009300112724304199, 0.0011219978332519531, 0.0013139843940734863, 0.0015059709548950195, 0.0016979575157165527, 0.001889944076538086, 0.002081930637359619, 0.0022739171981811523, 0.0024659037590026855, 0.0026578903198242188, 0.002849876880645752, 0.003041863441467285, 0.0032338500022888184, 0.0034258365631103516, 0.0036178231239318848, 0.003809809684753418, 0.004001796245574951, 0.004193782806396484, 0.004385769367218018, 0.004577755928039551, 0.004769742488861084, 0.004961729049682617, 0.00515371561050415, 0.005345702171325684, 0.005537688732147217, 0.00572967529296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 3.0, 8.0, 9.0, 12.0, 21.0, 23.0, 22.0, 32.0, 38.0, 49.0, 83.0, 111.0, 135.0, 194.0, 310.0, 720.0, 15596.0, 1003730.0, 25527.0, 806.0, 320.0, 201.0, 140.0, 95.0, 73.0, 61.0, 43.0, 28.0, 35.0, 19.0, 22.0, 16.0, 13.0, 14.0, 5.0, 12.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111083984375, -0.10732460021972656, -0.10356521606445312, -0.09980583190917969, -0.09604644775390625, -0.09228706359863281, -0.08852767944335938, -0.08476829528808594, -0.0810089111328125, -0.07724952697753906, -0.07349014282226562, -0.06973075866699219, -0.06597137451171875, -0.06221199035644531, -0.058452606201171875, -0.05469322204589844, -0.050933837890625, -0.04717445373535156, -0.043415069580078125, -0.03965568542480469, -0.03589630126953125, -0.03213691711425781, -0.028377532958984375, -0.024618148803710938, -0.0208587646484375, -0.017099380493164062, -0.013339996337890625, -0.009580612182617188, -0.00582122802734375, -0.0020618438720703125, 0.001697540283203125, 0.0054569244384765625, 0.00921630859375, 0.012975692749023438, 0.016735076904296875, 0.020494461059570312, 0.02425384521484375, 0.028013229370117188, 0.031772613525390625, 0.03553199768066406, 0.0392913818359375, 0.04305076599121094, 0.046810150146484375, 0.05056953430175781, 0.05432891845703125, 0.05808830261230469, 0.061847686767578125, 0.06560707092285156, 0.069366455078125, 0.07312583923339844, 0.07688522338867188, 0.08064460754394531, 0.08440399169921875, 0.08816337585449219, 0.09192276000976562, 0.09568214416503906, 0.0994415283203125, 0.10320091247558594, 0.10696029663085938, 0.11071968078613281, 0.11447906494140625, 0.11823844909667969, 0.12199783325195312, 0.12575721740722656, 0.1295166015625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 201.0, 700.0, 106.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024994623381644487, -0.0014556304085999727, -0.0004117984790354967, 0.0006320334505289793, 0.0016758653800934553, 0.0027196973096579313, 0.0037635292392224073, 0.004807361401617527, 0.005851193331182003, 0.006895025260746479, 0.007938857190310955, 0.008982689119875431, 0.010026521049439907, 0.011070352979004383, 0.012114184908568859, 0.013158016838133335, 0.014201848767697811, 0.015245680697262287, 0.016289513558149338, 0.017333343625068665, 0.01837717741727829, 0.019421007484197617, 0.020464841276407242, 0.02150867134332657, 0.022552503272891045, 0.02359633520245552, 0.024640167132019997, 0.025683999061584473, 0.02672783099114895, 0.027771662920713425, 0.0288154948502779, 0.029859326779842377, 0.030903160572052002, 0.03194699436426163, 0.032990824431180954, 0.03403465449810028, 0.035078488290309906, 0.03612232208251953, 0.03716615214943886, 0.038209982216358185, 0.03925381600856781, 0.040297649800777435, 0.04134147986769676, 0.04238530993461609, 0.043429143726825714, 0.04447297751903534, 0.045516807585954666, 0.04656063765287399, 0.04760447144508362, 0.04864830523729324, 0.04969213530421257, 0.0507359653711319, 0.05177979916334152, 0.05282363295555115, 0.053867463022470474, 0.0549112930893898, 0.055955126881599426, 0.05699896067380905, 0.05804279074072838, 0.059086620807647705, 0.06013045459985733, 0.061174288392066956, 0.06221811845898628, 0.06326194852590561, 0.06430578231811523]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 7.0, 11.0, 17.0, 24.0, 20.0, 17.0, 33.0, 23.0, 32.0, 39.0, 30.0, 43.0, 39.0, 53.0, 51.0, 38.0, 43.0, 43.0, 44.0, 48.0, 44.0, 41.0, 36.0, 33.0, 22.0, 19.0, 21.0, 25.0, 14.0, 14.0, 11.0, 14.0, 5.0, 6.0, 7.0, 6.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.00412142276763916, -0.004003624431788921, -0.0038858260959386826, -0.0037680277600884438, -0.003650229424238205, -0.003532431088387966, -0.0034146327525377274, -0.0032968344166874886, -0.0031790360808372498, -0.003061237744987011, -0.002943439409136772, -0.0028256410732865334, -0.0027078427374362946, -0.0025900444015860558, -0.002472246065735817, -0.002354447729885578, -0.0022366493940353394, -0.0021188510581851006, -0.0020010527223348618, -0.001883254386484623, -0.0017654560506343842, -0.0016476577147841454, -0.0015298593789339066, -0.0014120610430836678, -0.001294262707233429, -0.0011764643713831902, -0.0010586660355329514, -0.0009408676996827126, -0.0008230693638324738, -0.000705271027982235, -0.0005874726921319962, -0.00046967435628175735, -0.00035187602043151855, -0.00023407768458127975, -0.00011627934873104095, 1.5189871191978455e-06, 0.00011931732296943665, 0.00023711565881967545, 0.00035491399466991425, 0.00047271233052015305, 0.0005905106663703918, 0.0007083090022206306, 0.0008261073380708694, 0.0009439056739211082, 0.001061704009771347, 0.0011795023456215858, 0.0012973006814718246, 0.0014150990173220634, 0.0015328973531723022, 0.001650695689022541, 0.0017684940248727798, 0.0018862923607230186, 0.0020040906965732574, 0.0021218890324234962, 0.002239687368273735, 0.002357485704123974, 0.0024752840399742126, 0.0025930823758244514, 0.0027108807116746902, 0.002828679047524929, 0.002946477383375168, 0.0030642757192254066, 0.0031820740550756454, 0.0032998723909258842, 0.003417670726776123]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 10.0, 12.0, 7.0, 10.0, 14.0, 17.0, 17.0, 13.0, 15.0, 25.0, 26.0, 33.0, 27.0, 40.0, 32.0, 41.0, 37.0, 34.0, 36.0, 37.0, 45.0, 43.0, 33.0, 33.0, 47.0, 42.0, 34.0, 25.0, 25.0, 21.0, 23.0, 23.0, 24.0, 12.0, 15.0, 10.0, 8.0, 12.0, 8.0, 8.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-6.20703125, -6.02313232421875, -5.8392333984375, -5.65533447265625, -5.471435546875, -5.28753662109375, -5.1036376953125, -4.91973876953125, -4.73583984375, -4.55194091796875, -4.3680419921875, -4.18414306640625, -4.000244140625, -3.81634521484375, -3.6324462890625, -3.44854736328125, -3.2646484375, -3.08074951171875, -2.8968505859375, -2.71295166015625, -2.529052734375, -2.34515380859375, -2.1612548828125, -1.97735595703125, -1.79345703125, -1.60955810546875, -1.4256591796875, -1.24176025390625, -1.057861328125, -0.87396240234375, -0.6900634765625, -0.50616455078125, -0.322265625, -0.13836669921875, 0.0455322265625, 0.22943115234375, 0.413330078125, 0.59722900390625, 0.7811279296875, 0.96502685546875, 1.14892578125, 1.33282470703125, 1.5167236328125, 1.70062255859375, 1.884521484375, 2.06842041015625, 2.2523193359375, 2.43621826171875, 2.6201171875, 2.80401611328125, 2.9879150390625, 3.17181396484375, 3.355712890625, 3.53961181640625, 3.7235107421875, 3.90740966796875, 4.09130859375, 4.27520751953125, 4.4591064453125, 4.64300537109375, 4.826904296875, 5.01080322265625, 5.1947021484375, 5.37860107421875, 5.5625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 3.0, 0.0, 6.0, 9.0, 13.0, 15.0, 12.0, 19.0, 29.0, 39.0, 62.0, 99.0, 155.0, 231.0, 287.0, 528.0, 828.0, 1297.0, 2196.0, 3696.0, 6382.0, 11262.0, 21006.0, 41809.0, 87378.0, 210537.0, 350881.0, 163258.0, 70927.0, 34391.0, 17742.0, 9644.0, 5400.0, 3242.0, 1905.0, 1155.0, 736.0, 441.0, 312.0, 204.0, 136.0, 82.0, 69.0, 43.0, 27.0, 12.0, 29.0, 8.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.02734375, -3.89471435546875, -3.7620849609375, -3.62945556640625, -3.496826171875, -3.36419677734375, -3.2315673828125, -3.09893798828125, -2.96630859375, -2.83367919921875, -2.7010498046875, -2.56842041015625, -2.435791015625, -2.30316162109375, -2.1705322265625, -2.03790283203125, -1.9052734375, -1.77264404296875, -1.6400146484375, -1.50738525390625, -1.374755859375, -1.24212646484375, -1.1094970703125, -0.97686767578125, -0.84423828125, -0.71160888671875, -0.5789794921875, -0.44635009765625, -0.313720703125, -0.18109130859375, -0.0484619140625, 0.08416748046875, 0.216796875, 0.34942626953125, 0.4820556640625, 0.61468505859375, 0.747314453125, 0.87994384765625, 1.0125732421875, 1.14520263671875, 1.27783203125, 1.41046142578125, 1.5430908203125, 1.67572021484375, 1.808349609375, 1.94097900390625, 2.0736083984375, 2.20623779296875, 2.3388671875, 2.47149658203125, 2.6041259765625, 2.73675537109375, 2.869384765625, 3.00201416015625, 3.1346435546875, 3.26727294921875, 3.39990234375, 3.53253173828125, 3.6651611328125, 3.79779052734375, 3.930419921875, 4.06304931640625, 4.1956787109375, 4.32830810546875, 4.4609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 2.0, 6.0, 8.0, 7.0, 5.0, 8.0, 15.0, 18.0, 20.0, 25.0, 22.0, 28.0, 28.0, 29.0, 34.0, 49.0, 52.0, 43.0, 78.0, 211.0, 1670.0, 157.0, 86.0, 63.0, 37.0, 48.0, 34.0, 39.0, 29.0, 29.0, 25.0, 20.0, 15.0, 24.0, 15.0, 13.0, 15.0, 10.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-24.578125, -23.864501953125, -23.15087890625, -22.437255859375, -21.7236328125, -21.010009765625, -20.29638671875, -19.582763671875, -18.869140625, -18.155517578125, -17.44189453125, -16.728271484375, -16.0146484375, -15.301025390625, -14.58740234375, -13.873779296875, -13.16015625, -12.446533203125, -11.73291015625, -11.019287109375, -10.3056640625, -9.592041015625, -8.87841796875, -8.164794921875, -7.451171875, -6.737548828125, -6.02392578125, -5.310302734375, -4.5966796875, -3.883056640625, -3.16943359375, -2.455810546875, -1.7421875, -1.028564453125, -0.31494140625, 0.398681640625, 1.1123046875, 1.825927734375, 2.53955078125, 3.253173828125, 3.966796875, 4.680419921875, 5.39404296875, 6.107666015625, 6.8212890625, 7.534912109375, 8.24853515625, 8.962158203125, 9.67578125, 10.389404296875, 11.10302734375, 11.816650390625, 12.5302734375, 13.243896484375, 13.95751953125, 14.671142578125, 15.384765625, 16.098388671875, 16.81201171875, 17.525634765625, 18.2392578125, 18.952880859375, 19.66650390625, 20.380126953125, 21.09375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 4.0, 10.0, 15.0, 11.0, 13.0, 29.0, 16.0, 21.0, 30.0, 41.0, 48.0, 55.0, 90.0, 145.0, 246.0, 520.0, 1470.0, 10109.0, 1988976.0, 1132684.0, 8590.0, 1348.0, 492.0, 230.0, 140.0, 81.0, 54.0, 52.0, 22.0, 35.0, 25.0, 20.0, 12.0, 15.0, 9.0, 9.0, 6.0, 8.0, 3.0, 5.0, 2.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.96875, -34.7685546875, -33.568359375, -32.3681640625, -31.16796875, -29.9677734375, -28.767578125, -27.5673828125, -26.3671875, -25.1669921875, -23.966796875, -22.7666015625, -21.56640625, -20.3662109375, -19.166015625, -17.9658203125, -16.765625, -15.5654296875, -14.365234375, -13.1650390625, -11.96484375, -10.7646484375, -9.564453125, -8.3642578125, -7.1640625, -5.9638671875, -4.763671875, -3.5634765625, -2.36328125, -1.1630859375, 0.037109375, 1.2373046875, 2.4375, 3.6376953125, 4.837890625, 6.0380859375, 7.23828125, 8.4384765625, 9.638671875, 10.8388671875, 12.0390625, 13.2392578125, 14.439453125, 15.6396484375, 16.83984375, 18.0400390625, 19.240234375, 20.4404296875, 21.640625, 22.8408203125, 24.041015625, 25.2412109375, 26.44140625, 27.6416015625, 28.841796875, 30.0419921875, 31.2421875, 32.4423828125, 33.642578125, 34.8427734375, 36.04296875, 37.2431640625, 38.443359375, 39.6435546875, 40.84375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 13.0, 56.0, 178.0, 318.0, 300.0, 97.0, 43.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.60333251953125, -85.28251647949219, -82.9616928100586, -80.640869140625, -78.32005310058594, -75.99923706054688, -73.67841339111328, -71.35758972167969, -69.03677368164062, -66.71595764160156, -64.39513397216797, -62.07431411743164, -59.75349426269531, -57.432674407958984, -55.111854553222656, -52.79103469848633, -50.47021484375, -48.14939498901367, -45.828575134277344, -43.507755279541016, -41.18693542480469, -38.86611557006836, -36.54529571533203, -34.2244758605957, -31.903656005859375, -29.582836151123047, -27.26201629638672, -24.94119644165039, -22.620376586914062, -20.299556732177734, -17.978736877441406, -15.657917022705078, -13.337089538574219, -11.01626968383789, -8.695449829101562, -6.374629974365234, -4.053810119628906, -1.7329902648925781, 0.58782958984375, 2.908649444580078, 5.229469299316406, 7.550289154052734, 9.871109008789062, 12.19192886352539, 14.512748718261719, 16.833568572998047, 19.154388427734375, 21.475208282470703, 23.79602813720703, 26.11684799194336, 28.437667846679688, 30.758487701416016, 33.079307556152344, 35.40012741088867, 37.720947265625, 40.04176712036133, 42.362586975097656, 44.683406829833984, 47.00422668457031, 49.32504653930664, 51.64586639404297, 53.9666862487793, 56.287506103515625, 58.60832595825195, 60.92914581298828]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 4.0, 8.0, 6.0, 10.0, 14.0, 16.0, 25.0, 28.0, 25.0, 35.0, 40.0, 28.0, 32.0, 32.0, 36.0, 53.0, 47.0, 46.0, 41.0, 52.0, 49.0, 36.0, 38.0, 30.0, 35.0, 28.0, 30.0, 28.0, 25.0, 23.0, 16.0, 18.0, 17.0, 8.0, 8.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.84596252441406, -76.44082641601562, -74.03568267822266, -71.63054656982422, -69.22541046142578, -66.82026672363281, -64.41513061523438, -62.00999450683594, -59.604854583740234, -57.19971466064453, -54.794578552246094, -52.38943862915039, -49.98429870605469, -47.57916259765625, -45.17402267456055, -42.768882751464844, -40.363746643066406, -37.9586067199707, -35.553470611572266, -33.14833068847656, -30.743192672729492, -28.338054656982422, -25.93291473388672, -23.52777671813965, -21.122638702392578, -18.717500686645508, -16.312362670898438, -13.907222747802734, -11.502084732055664, -9.096946716308594, -6.691807746887207, -4.28666877746582, -1.8815383911132812, 0.5236001014709473, 2.928738594055176, 5.333877086639404, 7.739015579223633, 10.144153594970703, 12.54929256439209, 14.954431533813477, 17.359569549560547, 19.764707565307617, 22.169845581054688, 24.57498550415039, 26.98012351989746, 29.38526153564453, 31.790401458740234, 34.19554138183594, 36.600677490234375, 39.00581741333008, 41.410953521728516, 43.81609344482422, 46.221229553222656, 48.62636947631836, 51.03150939941406, 53.4366455078125, 55.8417854309082, 58.246925354003906, 60.652061462402344, 63.05720138549805, 65.46234130859375, 67.86747741699219, 70.27261352539062, 72.6777572631836, 75.08289337158203]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 11.0, 12.0, 9.0, 10.0, 14.0, 13.0, 14.0, 14.0, 23.0, 27.0, 21.0, 24.0, 21.0, 47.0, 37.0, 40.0, 40.0, 41.0, 33.0, 47.0, 43.0, 39.0, 42.0, 44.0, 37.0, 47.0, 30.0, 36.0, 20.0, 30.0, 18.0, 21.0, 17.0, 13.0, 16.0, 8.0, 8.0, 13.0, 4.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.423095703125, -6.22119140625, -6.019287109375, -5.8173828125, -5.615478515625, -5.41357421875, -5.211669921875, -5.009765625, -4.807861328125, -4.60595703125, -4.404052734375, -4.2021484375, -4.000244140625, -3.79833984375, -3.596435546875, -3.39453125, -3.192626953125, -2.99072265625, -2.788818359375, -2.5869140625, -2.385009765625, -2.18310546875, -1.981201171875, -1.779296875, -1.577392578125, -1.37548828125, -1.173583984375, -0.9716796875, -0.769775390625, -0.56787109375, -0.365966796875, -0.1640625, 0.037841796875, 0.23974609375, 0.441650390625, 0.6435546875, 0.845458984375, 1.04736328125, 1.249267578125, 1.451171875, 1.653076171875, 1.85498046875, 2.056884765625, 2.2587890625, 2.460693359375, 2.66259765625, 2.864501953125, 3.06640625, 3.268310546875, 3.47021484375, 3.672119140625, 3.8740234375, 4.075927734375, 4.27783203125, 4.479736328125, 4.681640625, 4.883544921875, 5.08544921875, 5.287353515625, 5.4892578125, 5.691162109375, 5.89306640625, 6.094970703125, 6.296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 8.0, 2.0, 4.0, 8.0, 9.0, 8.0, 9.0, 17.0, 12.0, 22.0, 13.0, 27.0, 22.0, 30.0, 27.0, 62.0, 79.0, 143.0, 302.0, 994.0, 5362.0, 50413.0, 1202341.0, 2793520.0, 127477.0, 10765.0, 1634.0, 406.0, 165.0, 94.0, 63.0, 49.0, 37.0, 32.0, 18.0, 15.0, 19.0, 19.0, 12.0, 9.0, 6.0, 4.0, 8.0, 4.0, 3.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.234375, -27.356689453125, -26.47900390625, -25.601318359375, -24.7236328125, -23.845947265625, -22.96826171875, -22.090576171875, -21.212890625, -20.335205078125, -19.45751953125, -18.579833984375, -17.7021484375, -16.824462890625, -15.94677734375, -15.069091796875, -14.19140625, -13.313720703125, -12.43603515625, -11.558349609375, -10.6806640625, -9.802978515625, -8.92529296875, -8.047607421875, -7.169921875, -6.292236328125, -5.41455078125, -4.536865234375, -3.6591796875, -2.781494140625, -1.90380859375, -1.026123046875, -0.1484375, 0.729248046875, 1.60693359375, 2.484619140625, 3.3623046875, 4.239990234375, 5.11767578125, 5.995361328125, 6.873046875, 7.750732421875, 8.62841796875, 9.506103515625, 10.3837890625, 11.261474609375, 12.13916015625, 13.016845703125, 13.89453125, 14.772216796875, 15.64990234375, 16.527587890625, 17.4052734375, 18.282958984375, 19.16064453125, 20.038330078125, 20.916015625, 21.793701171875, 22.67138671875, 23.549072265625, 24.4267578125, 25.304443359375, 26.18212890625, 27.059814453125, 27.9375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 11.0, 5.0, 9.0, 26.0, 24.0, 49.0, 71.0, 114.0, 169.0, 324.0, 443.0, 627.0, 673.0, 521.0, 374.0, 239.0, 155.0, 90.0, 65.0, 44.0, 21.0, 8.0, 10.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.71875, -33.89697265625, -33.0751953125, -32.25341796875, -31.431640625, -30.60986328125, -29.7880859375, -28.96630859375, -28.14453125, -27.32275390625, -26.5009765625, -25.67919921875, -24.857421875, -24.03564453125, -23.2138671875, -22.39208984375, -21.5703125, -20.74853515625, -19.9267578125, -19.10498046875, -18.283203125, -17.46142578125, -16.6396484375, -15.81787109375, -14.99609375, -14.17431640625, -13.3525390625, -12.53076171875, -11.708984375, -10.88720703125, -10.0654296875, -9.24365234375, -8.421875, -7.60009765625, -6.7783203125, -5.95654296875, -5.134765625, -4.31298828125, -3.4912109375, -2.66943359375, -1.84765625, -1.02587890625, -0.2041015625, 0.61767578125, 1.439453125, 2.26123046875, 3.0830078125, 3.90478515625, 4.7265625, 5.54833984375, 6.3701171875, 7.19189453125, 8.013671875, 8.83544921875, 9.6572265625, 10.47900390625, 11.30078125, 12.12255859375, 12.9443359375, 13.76611328125, 14.587890625, 15.40966796875, 16.2314453125, 17.05322265625, 17.875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 12.0, 24.0, 51.0, 65.0, 119.0, 185.0, 382.0, 901.0, 3887.0, 47458.0, 1947064.0, 2137218.0, 51071.0, 4039.0, 962.0, 380.0, 204.0, 91.0, 73.0, 28.0, 23.0, 21.0, 7.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.15625, -39.28662109375, -37.4169921875, -35.54736328125, -33.677734375, -31.80810546875, -29.9384765625, -28.06884765625, -26.19921875, -24.32958984375, -22.4599609375, -20.59033203125, -18.720703125, -16.85107421875, -14.9814453125, -13.11181640625, -11.2421875, -9.37255859375, -7.5029296875, -5.63330078125, -3.763671875, -1.89404296875, -0.0244140625, 1.84521484375, 3.71484375, 5.58447265625, 7.4541015625, 9.32373046875, 11.193359375, 13.06298828125, 14.9326171875, 16.80224609375, 18.671875, 20.54150390625, 22.4111328125, 24.28076171875, 26.150390625, 28.02001953125, 29.8896484375, 31.75927734375, 33.62890625, 35.49853515625, 37.3681640625, 39.23779296875, 41.107421875, 42.97705078125, 44.8466796875, 46.71630859375, 48.5859375, 50.45556640625, 52.3251953125, 54.19482421875, 56.064453125, 57.93408203125, 59.8037109375, 61.67333984375, 63.54296875, 65.41259765625, 67.2822265625, 69.15185546875, 71.021484375, 72.89111328125, 74.7607421875, 76.63037109375, 78.5]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 22.0, 31.0, 34.0, 55.0, 74.0, 93.0, 127.0, 113.0, 117.0, 111.0, 84.0, 48.0, 37.0, 29.0, 17.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.38624954223633, -59.204132080078125, -56.02201461791992, -52.83989715576172, -49.65777587890625, -46.47566223144531, -43.293540954589844, -40.11142349243164, -36.92930603027344, -33.747188568115234, -30.56507110595703, -27.382951736450195, -24.200834274291992, -21.01871681213379, -17.836597442626953, -14.65447998046875, -11.472362518310547, -8.290245056152344, -5.108126640319824, -1.9260082244873047, 1.2561092376708984, 4.438226699829102, 7.6203460693359375, 10.80246353149414, 13.984580993652344, 17.166698455810547, 20.34881591796875, 23.530935287475586, 26.71305274963379, 29.895170211791992, 33.07728958129883, 36.25940704345703, 39.4415283203125, 42.6236457824707, 45.805763244628906, 48.987884521484375, 52.16999816894531, 55.35211944580078, 58.534236907958984, 61.71635437011719, 64.89846801757812, 68.0805892944336, 71.26270294189453, 74.44482421875, 77.62693786621094, 80.8090591430664, 83.99118041992188, 87.17329406738281, 90.35541534423828, 93.53753662109375, 96.71965026855469, 99.90177154541016, 103.0838851928711, 106.26600646972656, 109.4481201171875, 112.63024139404297, 115.81236267089844, 118.9944839477539, 122.17659759521484, 125.35871887207031, 128.54083251953125, 131.7229461669922, 134.9050750732422, 138.08718872070312, 141.26930236816406]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 12.0, 5.0, 8.0, 11.0, 19.0, 17.0, 23.0, 26.0, 22.0, 33.0, 33.0, 35.0, 40.0, 45.0, 32.0, 50.0, 40.0, 38.0, 43.0, 38.0, 49.0, 48.0, 49.0, 40.0, 44.0, 34.0, 31.0, 20.0, 18.0, 12.0, 21.0, 18.0, 14.0, 8.0, 6.0, 2.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.27806091308594, -59.15653991699219, -57.03501892089844, -54.91349792480469, -52.79197692871094, -50.67045593261719, -48.54893112182617, -46.42741012573242, -44.30588912963867, -42.18436813354492, -40.06284713745117, -37.94132614135742, -35.819801330566406, -33.698280334472656, -31.576759338378906, -29.455238342285156, -27.333717346191406, -25.212196350097656, -23.090675354003906, -20.969152450561523, -18.847631454467773, -16.726110458374023, -14.604588508605957, -12.48306655883789, -10.36154556274414, -8.24002456665039, -6.118502616882324, -3.996981143951416, -1.8754596710205078, 0.2460613250732422, 2.3675832748413086, 4.489105224609375, 6.610626220703125, 8.732147216796875, 10.853669166564941, 12.975191116333008, 15.096712112426758, 17.218233108520508, 19.33975601196289, 21.46127700805664, 23.58279800415039, 25.70431900024414, 27.82583999633789, 29.947362899780273, 32.068885803222656, 34.190406799316406, 36.311927795410156, 38.433448791503906, 40.554969787597656, 42.676490783691406, 44.798011779785156, 46.919532775878906, 49.041053771972656, 51.162574768066406, 53.28409957885742, 55.40562057495117, 57.52714157104492, 59.64866256713867, 61.77018356323242, 63.89170455932617, 66.01322937011719, 68.13475036621094, 70.25627136230469, 72.37779235839844, 74.49931335449219]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 11.0, 5.0, 12.0, 6.0, 11.0, 17.0, 13.0, 19.0, 10.0, 19.0, 21.0, 29.0, 38.0, 31.0, 49.0, 31.0, 31.0, 41.0, 53.0, 49.0, 37.0, 43.0, 45.0, 44.0, 44.0, 34.0, 44.0, 22.0, 41.0, 24.0, 12.0, 20.0, 20.0, 18.0, 13.0, 14.0, 5.0, 3.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.3515625, -7.12908935546875, -6.9066162109375, -6.68414306640625, -6.461669921875, -6.23919677734375, -6.0167236328125, -5.79425048828125, -5.57177734375, -5.34930419921875, -5.1268310546875, -4.90435791015625, -4.681884765625, -4.45941162109375, -4.2369384765625, -4.01446533203125, -3.7919921875, -3.56951904296875, -3.3470458984375, -3.12457275390625, -2.902099609375, -2.67962646484375, -2.4571533203125, -2.23468017578125, -2.01220703125, -1.78973388671875, -1.5672607421875, -1.34478759765625, -1.122314453125, -0.89984130859375, -0.6773681640625, -0.45489501953125, -0.232421875, -0.00994873046875, 0.2125244140625, 0.43499755859375, 0.657470703125, 0.87994384765625, 1.1024169921875, 1.32489013671875, 1.54736328125, 1.76983642578125, 1.9923095703125, 2.21478271484375, 2.437255859375, 2.65972900390625, 2.8822021484375, 3.10467529296875, 3.3271484375, 3.54962158203125, 3.7720947265625, 3.99456787109375, 4.217041015625, 4.43951416015625, 4.6619873046875, 4.88446044921875, 5.10693359375, 5.32940673828125, 5.5518798828125, 5.77435302734375, 5.996826171875, 6.21929931640625, 6.4417724609375, 6.66424560546875, 6.88671875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 12.0, 18.0, 20.0, 34.0, 56.0, 77.0, 101.0, 151.0, 226.0, 298.0, 435.0, 629.0, 986.0, 1307.0, 2054.0, 2942.0, 4247.0, 6533.0, 9684.0, 14507.0, 22290.0, 34438.0, 52621.0, 81522.0, 123308.0, 164869.0, 164973.0, 123337.0, 81960.0, 53355.0, 34516.0, 22324.0, 14705.0, 9612.0, 6516.0, 4398.0, 2969.0, 1988.0, 1314.0, 964.0, 697.0, 485.0, 350.0, 219.0, 142.0, 119.0, 77.0, 49.0, 42.0, 33.0, 16.0, 10.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0], "bins": [-0.49365234375, -0.4782295227050781, -0.46280670166015625, -0.4473838806152344, -0.4319610595703125, -0.4165382385253906, -0.40111541748046875, -0.3856925964355469, -0.370269775390625, -0.3548469543457031, -0.33942413330078125, -0.3240013122558594, -0.3085784912109375, -0.2931556701660156, -0.27773284912109375, -0.2623100280761719, -0.24688720703125, -0.23146438598632812, -0.21604156494140625, -0.20061874389648438, -0.1851959228515625, -0.16977310180664062, -0.15435028076171875, -0.13892745971679688, -0.123504638671875, -0.10808181762695312, -0.09265899658203125, -0.07723617553710938, -0.0618133544921875, -0.046390533447265625, -0.03096771240234375, -0.015544891357421875, -0.0001220703125, 0.015300750732421875, 0.03072357177734375, 0.046146392822265625, 0.0615692138671875, 0.07699203491210938, 0.09241485595703125, 0.10783767700195312, 0.123260498046875, 0.13868331909179688, 0.15410614013671875, 0.16952896118164062, 0.1849517822265625, 0.20037460327148438, 0.21579742431640625, 0.23122024536132812, 0.24664306640625, 0.2620658874511719, 0.27748870849609375, 0.2929115295410156, 0.3083343505859375, 0.3237571716308594, 0.33917999267578125, 0.3546028137207031, 0.370025634765625, 0.3854484558105469, 0.40087127685546875, 0.4162940979003906, 0.4317169189453125, 0.4471397399902344, 0.46256256103515625, 0.4779853820800781, 0.493408203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 8.0, 10.0, 8.0, 10.0, 18.0, 12.0, 13.0, 19.0, 23.0, 24.0, 21.0, 33.0, 26.0, 35.0, 35.0, 29.0, 60.0, 39.0, 31.0, 45.0, 1066.0, 32.0, 35.0, 31.0, 41.0, 39.0, 31.0, 21.0, 40.0, 26.0, 25.0, 19.0, 16.0, 19.0, 10.0, 10.0, 11.0, 10.0, 6.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.25390625, -4.126953125, -4.0, -3.873046875, -3.74609375, -3.619140625, -3.4921875, -3.365234375, -3.23828125, -3.111328125, -2.984375, -2.857421875, -2.73046875, -2.603515625, -2.4765625, -2.349609375, -2.22265625, -2.095703125, -1.96875, -1.841796875, -1.71484375, -1.587890625, -1.4609375, -1.333984375, -1.20703125, -1.080078125, -0.953125, -0.826171875, -0.69921875, -0.572265625, -0.4453125, -0.318359375, -0.19140625, -0.064453125, 0.0625, 0.189453125, 0.31640625, 0.443359375, 0.5703125, 0.697265625, 0.82421875, 0.951171875, 1.078125, 1.205078125, 1.33203125, 1.458984375, 1.5859375, 1.712890625, 1.83984375, 1.966796875, 2.09375, 2.220703125, 2.34765625, 2.474609375, 2.6015625, 2.728515625, 2.85546875, 2.982421875, 3.109375, 3.236328125, 3.36328125, 3.490234375, 3.6171875, 3.744140625, 3.87109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 15.0, 21.0, 26.0, 52.0, 74.0, 127.0, 178.0, 256.0, 414.0, 647.0, 1045.0, 1547.0, 2406.0, 3725.0, 5839.0, 8997.0, 14081.0, 21812.0, 33786.0, 51747.0, 76492.0, 108886.0, 151490.0, 1180465.0, 133673.0, 99613.0, 69343.0, 46528.0, 29829.0, 19200.0, 12395.0, 8039.0, 5169.0, 3215.0, 2104.0, 1351.0, 875.0, 527.0, 350.0, 246.0, 171.0, 134.0, 67.0, 53.0, 40.0, 21.0, 19.0, 12.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.328857421875, -0.3183708190917969, -0.30788421630859375, -0.2973976135253906, -0.2869110107421875, -0.2764244079589844, -0.26593780517578125, -0.2554512023925781, -0.244964599609375, -0.23447799682617188, -0.22399139404296875, -0.21350479125976562, -0.2030181884765625, -0.19253158569335938, -0.18204498291015625, -0.17155838012695312, -0.16107177734375, -0.15058517456054688, -0.14009857177734375, -0.12961196899414062, -0.1191253662109375, -0.10863876342773438, -0.09815216064453125, -0.08766555786132812, -0.077178955078125, -0.06669235229492188, -0.05620574951171875, -0.045719146728515625, -0.0352325439453125, -0.024745941162109375, -0.01425933837890625, -0.003772735595703125, 0.0067138671875, 0.017200469970703125, 0.02768707275390625, 0.038173675537109375, 0.0486602783203125, 0.059146881103515625, 0.06963348388671875, 0.08012008666992188, 0.090606689453125, 0.10109329223632812, 0.11157989501953125, 0.12206649780273438, 0.1325531005859375, 0.14303970336914062, 0.15352630615234375, 0.16401290893554688, 0.17449951171875, 0.18498611450195312, 0.19547271728515625, 0.20595932006835938, 0.2164459228515625, 0.22693252563476562, 0.23741912841796875, 0.24790573120117188, 0.258392333984375, 0.2688789367675781, 0.27936553955078125, 0.2898521423339844, 0.3003387451171875, 0.3108253479003906, 0.32131195068359375, 0.3317985534667969, 0.34228515625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 5.0, 14.0, 15.0, 26.0, 43.0, 83.0, 120.0, 189.0, 193.0, 125.0, 61.0, 45.0, 26.0, 14.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0159759521484375, -0.015441179275512695, -0.01490640640258789, -0.014371633529663086, -0.013836860656738281, -0.013302087783813477, -0.012767314910888672, -0.012232542037963867, -0.011697769165039062, -0.011162996292114258, -0.010628223419189453, -0.010093450546264648, -0.009558677673339844, -0.009023904800415039, -0.008489131927490234, -0.00795435905456543, -0.007419586181640625, -0.00688481330871582, -0.006350040435791016, -0.005815267562866211, -0.005280494689941406, -0.0047457218170166016, -0.004210948944091797, -0.003676176071166992, -0.0031414031982421875, -0.002606630325317383, -0.002071857452392578, -0.0015370845794677734, -0.0010023117065429688, -0.00046753883361816406, 6.723403930664062e-05, 0.0006020069122314453, 0.00113677978515625, 0.0016715526580810547, 0.0022063255310058594, 0.002741098403930664, 0.0032758712768554688, 0.0038106441497802734, 0.004345417022705078, 0.004880189895629883, 0.0054149627685546875, 0.005949735641479492, 0.006484508514404297, 0.0070192813873291016, 0.007554054260253906, 0.008088827133178711, 0.008623600006103516, 0.00915837287902832, 0.009693145751953125, 0.01022791862487793, 0.010762691497802734, 0.011297464370727539, 0.011832237243652344, 0.012367010116577148, 0.012901782989501953, 0.013436555862426758, 0.013971328735351562, 0.014506101608276367, 0.015040874481201172, 0.015575647354125977, 0.01611042022705078, 0.016645193099975586, 0.01717996597290039, 0.017714738845825195, 0.01824951171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 9.0, 14.0, 15.0, 26.0, 50.0, 94.0, 163.0, 373.0, 2179.0, 1037227.0, 7522.0, 431.0, 215.0, 89.0, 46.0, 29.0, 16.0, 9.0, 4.0, 11.0, 4.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3095703125, -0.3003578186035156, -0.29114532470703125, -0.2819328308105469, -0.2727203369140625, -0.2635078430175781, -0.25429534912109375, -0.24508285522460938, -0.235870361328125, -0.22665786743164062, -0.21744537353515625, -0.20823287963867188, -0.1990203857421875, -0.18980789184570312, -0.18059539794921875, -0.17138290405273438, -0.16217041015625, -0.15295791625976562, -0.14374542236328125, -0.13453292846679688, -0.1253204345703125, -0.11610794067382812, -0.10689544677734375, -0.09768295288085938, -0.088470458984375, -0.07925796508789062, -0.07004547119140625, -0.060832977294921875, -0.0516204833984375, -0.042407989501953125, -0.03319549560546875, -0.023983001708984375, -0.0147705078125, -0.005558013916015625, 0.00365447998046875, 0.012866973876953125, 0.0220794677734375, 0.031291961669921875, 0.04050445556640625, 0.049716949462890625, 0.058929443359375, 0.06814193725585938, 0.07735443115234375, 0.08656692504882812, 0.0957794189453125, 0.10499191284179688, 0.11420440673828125, 0.12341690063476562, 0.13262939453125, 0.14184188842773438, 0.15105438232421875, 0.16026687622070312, 0.1694793701171875, 0.17869186401367188, 0.18790435791015625, 0.19711685180664062, 0.206329345703125, 0.21554183959960938, 0.22475433349609375, 0.23396682739257812, 0.2431793212890625, 0.2523918151855469, 0.26160430908203125, 0.2708168029785156, 0.280029296875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 127.0, 591.0, 268.0, 22.0], "bins": [-0.06963048130273819, -0.06850139051675797, -0.06737229973077774, -0.06624321639537811, -0.06511412560939789, -0.06398503482341766, -0.06285594403743744, -0.061726853251457214, -0.06059776619076729, -0.059468675404787064, -0.05833958834409714, -0.05721049755811691, -0.05608140677213669, -0.05495231971144676, -0.05382322892546654, -0.05269414186477661, -0.05156505107879639, -0.05043596029281616, -0.049306873232126236, -0.04817778244614601, -0.047048695385456085, -0.04591960459947586, -0.044790513813495636, -0.04366142302751541, -0.042532335966825485, -0.04140324518084526, -0.040274158120155334, -0.03914506733417511, -0.038015976548194885, -0.03688688948750496, -0.035757798701524734, -0.03462871164083481, -0.033499620854854584, -0.03237053006887436, -0.031241443008184433, -0.03011235222220421, -0.028983263298869133, -0.027854174375534058, -0.026725083589553833, -0.025595994666218758, -0.024466905742883682, -0.023337816819548607, -0.02220872789621353, -0.021079637110233307, -0.01995054818689823, -0.018821459263563156, -0.01769236847758293, -0.016563279554247856, -0.015434189699590206, -0.014305099844932556, -0.01317601092159748, -0.012046921998262405, -0.010917832143604755, -0.009788742288947105, -0.00865965336561203, -0.00753056351095438, -0.006401474587619305, -0.005272385198622942, -0.004143295809626579, -0.0030142064206302166, -0.001885117031633854, -0.0007560276426374912, 0.00037306174635887146, 0.0015021516010165215, 0.002631240524351597]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 3.0, 12.0, 10.0, 9.0, 8.0, 10.0, 17.0, 22.0, 27.0, 33.0, 31.0, 40.0, 29.0, 32.0, 46.0, 44.0, 42.0, 41.0, 45.0, 43.0, 42.0, 40.0, 43.0, 52.0, 34.0, 33.0, 29.0, 28.0, 15.0, 27.0, 23.0, 18.0, 22.0, 11.0, 9.0, 4.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0065416693687438965, -0.00637483224272728, -0.006207995116710663, -0.006041157990694046, -0.005874320864677429, -0.005707483738660812, -0.0055406466126441956, -0.005373809486627579, -0.005206972360610962, -0.005040135234594345, -0.004873298108577728, -0.0047064609825611115, -0.004539623856544495, -0.004372786730527878, -0.004205949604511261, -0.004039112478494644, -0.0038722753524780273, -0.0037054382264614105, -0.0035386011004447937, -0.003371763974428177, -0.00320492684841156, -0.0030380897223949432, -0.0028712525963783264, -0.0027044154703617096, -0.0025375783443450928, -0.002370741218328476, -0.002203904092311859, -0.0020370669662952423, -0.0018702298402786255, -0.0017033927142620087, -0.0015365555882453918, -0.001369718462228775, -0.0012028813362121582, -0.0010360442101955414, -0.0008692070841789246, -0.0007023699581623077, -0.0005355328321456909, -0.0003686957061290741, -0.00020185858011245728, -3.5021454095840454e-05, 0.00013181567192077637, 0.0002986527979373932, 0.00046548992395401, 0.0006323270499706268, 0.0007991641759872437, 0.0009660013020038605, 0.0011328384280204773, 0.0012996755540370941, 0.001466512680053711, 0.0016333498060703278, 0.0018001869320869446, 0.0019670240581035614, 0.0021338611841201782, 0.002300698310136795, 0.002467535436153412, 0.0026343725621700287, 0.0028012096881866455, 0.0029680468142032623, 0.003134883940219879, 0.003301721066236496, 0.003468558192253113, 0.0036353953182697296, 0.0038022324442863464, 0.003969069570302963, 0.00413590669631958]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 11.0, 5.0, 12.0, 6.0, 11.0, 17.0, 13.0, 19.0, 10.0, 19.0, 21.0, 29.0, 38.0, 31.0, 49.0, 31.0, 31.0, 41.0, 53.0, 49.0, 37.0, 43.0, 45.0, 44.0, 44.0, 34.0, 44.0, 22.0, 41.0, 24.0, 12.0, 20.0, 20.0, 18.0, 13.0, 14.0, 5.0, 3.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.3515625, -7.12908935546875, -6.9066162109375, -6.68414306640625, -6.461669921875, -6.23919677734375, -6.0167236328125, -5.79425048828125, -5.57177734375, -5.34930419921875, -5.1268310546875, -4.90435791015625, -4.681884765625, -4.45941162109375, -4.2369384765625, -4.01446533203125, -3.7919921875, -3.56951904296875, -3.3470458984375, -3.12457275390625, -2.902099609375, -2.67962646484375, -2.4571533203125, -2.23468017578125, -2.01220703125, -1.78973388671875, -1.5672607421875, -1.34478759765625, -1.122314453125, -0.89984130859375, -0.6773681640625, -0.45489501953125, -0.232421875, -0.00994873046875, 0.2125244140625, 0.43499755859375, 0.657470703125, 0.87994384765625, 1.1024169921875, 1.32489013671875, 1.54736328125, 1.76983642578125, 1.9923095703125, 2.21478271484375, 2.437255859375, 2.65972900390625, 2.8822021484375, 3.10467529296875, 3.3271484375, 3.54962158203125, 3.7720947265625, 3.99456787109375, 4.217041015625, 4.43951416015625, 4.6619873046875, 4.88446044921875, 5.10693359375, 5.32940673828125, 5.5518798828125, 5.77435302734375, 5.996826171875, 6.21929931640625, 6.4417724609375, 6.66424560546875, 6.88671875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 6.0, 6.0, 3.0, 11.0, 9.0, 17.0, 31.0, 38.0, 48.0, 80.0, 112.0, 169.0, 229.0, 313.0, 492.0, 883.0, 1367.0, 2311.0, 4296.0, 7964.0, 15826.0, 33149.0, 78689.0, 220297.0, 403425.0, 161946.0, 61294.0, 27051.0, 12922.0, 6675.0, 3513.0, 2069.0, 1176.0, 755.0, 443.0, 317.0, 181.0, 134.0, 93.0, 68.0, 49.0, 24.0, 25.0, 18.0, 14.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87109375, -3.7296142578125, -3.588134765625, -3.4466552734375, -3.30517578125, -3.1636962890625, -3.022216796875, -2.8807373046875, -2.7392578125, -2.5977783203125, -2.456298828125, -2.3148193359375, -2.17333984375, -2.0318603515625, -1.890380859375, -1.7489013671875, -1.607421875, -1.4659423828125, -1.324462890625, -1.1829833984375, -1.04150390625, -0.9000244140625, -0.758544921875, -0.6170654296875, -0.4755859375, -0.3341064453125, -0.192626953125, -0.0511474609375, 0.09033203125, 0.2318115234375, 0.373291015625, 0.5147705078125, 0.65625, 0.7977294921875, 0.939208984375, 1.0806884765625, 1.22216796875, 1.3636474609375, 1.505126953125, 1.6466064453125, 1.7880859375, 1.9295654296875, 2.071044921875, 2.2125244140625, 2.35400390625, 2.4954833984375, 2.636962890625, 2.7784423828125, 2.919921875, 3.0614013671875, 3.202880859375, 3.3443603515625, 3.48583984375, 3.6273193359375, 3.768798828125, 3.9102783203125, 4.0517578125, 4.1932373046875, 4.334716796875, 4.4761962890625, 4.61767578125, 4.7591552734375, 4.900634765625, 5.0421142578125, 5.18359375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 11.0, 6.0, 7.0, 11.0, 16.0, 17.0, 19.0, 19.0, 23.0, 26.0, 28.0, 29.0, 42.0, 39.0, 45.0, 47.0, 63.0, 227.0, 1777.0, 118.0, 64.0, 42.0, 46.0, 40.0, 43.0, 34.0, 31.0, 28.0, 30.0, 22.0, 23.0, 13.0, 12.0, 11.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-28.078125, -27.28271484375, -26.4873046875, -25.69189453125, -24.896484375, -24.10107421875, -23.3056640625, -22.51025390625, -21.71484375, -20.91943359375, -20.1240234375, -19.32861328125, -18.533203125, -17.73779296875, -16.9423828125, -16.14697265625, -15.3515625, -14.55615234375, -13.7607421875, -12.96533203125, -12.169921875, -11.37451171875, -10.5791015625, -9.78369140625, -8.98828125, -8.19287109375, -7.3974609375, -6.60205078125, -5.806640625, -5.01123046875, -4.2158203125, -3.42041015625, -2.625, -1.82958984375, -1.0341796875, -0.23876953125, 0.556640625, 1.35205078125, 2.1474609375, 2.94287109375, 3.73828125, 4.53369140625, 5.3291015625, 6.12451171875, 6.919921875, 7.71533203125, 8.5107421875, 9.30615234375, 10.1015625, 10.89697265625, 11.6923828125, 12.48779296875, 13.283203125, 14.07861328125, 14.8740234375, 15.66943359375, 16.46484375, 17.26025390625, 18.0556640625, 18.85107421875, 19.646484375, 20.44189453125, 21.2373046875, 22.03271484375, 22.828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 9.0, 9.0, 14.0, 9.0, 24.0, 17.0, 30.0, 39.0, 40.0, 47.0, 69.0, 125.0, 213.0, 342.0, 909.0, 5298.0, 922357.0, 2207601.0, 6551.0, 996.0, 344.0, 186.0, 128.0, 78.0, 51.0, 43.0, 31.0, 24.0, 21.0, 16.0, 15.0, 11.0, 14.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.21875, -35.93701171875, -34.6552734375, -33.37353515625, -32.091796875, -30.81005859375, -29.5283203125, -28.24658203125, -26.96484375, -25.68310546875, -24.4013671875, -23.11962890625, -21.837890625, -20.55615234375, -19.2744140625, -17.99267578125, -16.7109375, -15.42919921875, -14.1474609375, -12.86572265625, -11.583984375, -10.30224609375, -9.0205078125, -7.73876953125, -6.45703125, -5.17529296875, -3.8935546875, -2.61181640625, -1.330078125, -0.04833984375, 1.2333984375, 2.51513671875, 3.796875, 5.07861328125, 6.3603515625, 7.64208984375, 8.923828125, 10.20556640625, 11.4873046875, 12.76904296875, 14.05078125, 15.33251953125, 16.6142578125, 17.89599609375, 19.177734375, 20.45947265625, 21.7412109375, 23.02294921875, 24.3046875, 25.58642578125, 26.8681640625, 28.14990234375, 29.431640625, 30.71337890625, 31.9951171875, 33.27685546875, 34.55859375, 35.84033203125, 37.1220703125, 38.40380859375, 39.685546875, 40.96728515625, 42.2490234375, 43.53076171875, 44.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 104.0, 741.0, 163.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.85691261291504, -25.356592178344727, -19.856271743774414, -14.355951309204102, -8.855630874633789, -3.3553104400634766, 2.145009994506836, 7.645330429077148, 13.145650863647461, 18.645971298217773, 24.146291732788086, 29.6466121673584, 35.146934509277344, 40.647254943847656, 46.14757537841797, 51.64789581298828, 57.148216247558594, 62.648536682128906, 68.14885711669922, 73.64917755126953, 79.14949798583984, 84.64981842041016, 90.15013885498047, 95.65045928955078, 101.1507797241211, 106.6511001586914, 112.15142059326172, 117.65174102783203, 123.15206146240234, 128.65237426757812, 134.1527099609375, 139.65301513671875, 145.15335083007812, 150.65367126464844, 156.15399169921875, 161.65431213378906, 167.15463256835938, 172.6549530029297, 178.1552734375, 183.6555938720703, 189.15591430664062, 194.65623474121094, 200.15655517578125, 205.65687561035156, 211.15719604492188, 216.6575164794922, 222.1578369140625, 227.6581573486328, 233.15847778320312, 238.65879821777344, 244.15911865234375, 249.65943908691406, 255.15975952148438, 260.66009521484375, 266.160400390625, 271.66070556640625, 277.1610412597656, 282.661376953125, 288.16168212890625, 293.6619873046875, 299.1623229980469, 304.66265869140625, 310.1629638671875, 315.66326904296875, 321.1636047363281]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 7.0, 1.0, 8.0, 10.0, 5.0, 7.0, 12.0, 17.0, 19.0, 18.0, 23.0, 23.0, 34.0, 26.0, 26.0, 32.0, 37.0, 36.0, 31.0, 43.0, 30.0, 43.0, 40.0, 34.0, 37.0, 38.0, 23.0, 28.0, 30.0, 29.0, 40.0, 30.0, 24.0, 21.0, 19.0, 21.0, 16.0, 19.0, 12.0, 11.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-73.73575592041016, -71.53121948242188, -69.3266830444336, -67.12214660644531, -64.91761779785156, -62.713077545166016, -60.508544921875, -58.30400848388672, -56.09947204589844, -53.894935607910156, -51.690399169921875, -49.48586654663086, -47.28133010864258, -45.0767936706543, -42.87226104736328, -40.667724609375, -38.46318817138672, -36.25865173339844, -34.054115295410156, -31.84958267211914, -29.64504623413086, -27.440509796142578, -25.23597526550293, -23.03144073486328, -20.826904296875, -18.62236785888672, -16.41783332824707, -14.213297843933105, -12.00876235961914, -9.804226875305176, -7.599691390991211, -5.395155906677246, -3.1906280517578125, -0.9860925674438477, 1.2184429168701172, 3.422978401184082, 5.627513885498047, 7.832049369812012, 10.036584854125977, 12.241120338439941, 14.445655822753906, 16.650192260742188, 18.854726791381836, 21.059261322021484, 23.263797760009766, 25.468334197998047, 27.672868728637695, 29.877403259277344, 32.081939697265625, 34.286476135253906, 36.49101257324219, 38.6955451965332, 40.900081634521484, 43.104618072509766, 45.30915069580078, 47.51368713378906, 49.718223571777344, 51.922760009765625, 54.127296447753906, 56.33182907104492, 58.5363655090332, 60.740901947021484, 62.9454345703125, 65.14997100830078, 67.35450744628906]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 7.0, 12.0, 13.0, 11.0, 14.0, 16.0, 15.0, 20.0, 31.0, 26.0, 34.0, 40.0, 32.0, 44.0, 39.0, 35.0, 50.0, 49.0, 35.0, 44.0, 41.0, 42.0, 45.0, 31.0, 39.0, 35.0, 27.0, 27.0, 25.0, 12.0, 14.0, 21.0, 18.0, 7.0, 10.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.4609375, -7.23419189453125, -7.0074462890625, -6.78070068359375, -6.553955078125, -6.32720947265625, -6.1004638671875, -5.87371826171875, -5.64697265625, -5.42022705078125, -5.1934814453125, -4.96673583984375, -4.739990234375, -4.51324462890625, -4.2864990234375, -4.05975341796875, -3.8330078125, -3.60626220703125, -3.3795166015625, -3.15277099609375, -2.926025390625, -2.69927978515625, -2.4725341796875, -2.24578857421875, -2.01904296875, -1.79229736328125, -1.5655517578125, -1.33880615234375, -1.112060546875, -0.88531494140625, -0.6585693359375, -0.43182373046875, -0.205078125, 0.02166748046875, 0.2484130859375, 0.47515869140625, 0.701904296875, 0.92864990234375, 1.1553955078125, 1.38214111328125, 1.60888671875, 1.83563232421875, 2.0623779296875, 2.28912353515625, 2.515869140625, 2.74261474609375, 2.9693603515625, 3.19610595703125, 3.4228515625, 3.64959716796875, 3.8763427734375, 4.10308837890625, 4.329833984375, 4.55657958984375, 4.7833251953125, 5.01007080078125, 5.23681640625, 5.46356201171875, 5.6903076171875, 5.91705322265625, 6.143798828125, 6.37054443359375, 6.5972900390625, 6.82403564453125, 7.05078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 21.0, 25.0, 25.0, 45.0, 82.0, 113.0, 213.0, 384.0, 955.0, 2602.0, 8093.0, 31482.0, 152262.0, 1111396.0, 2331537.0, 455523.0, 74169.0, 17488.0, 4794.0, 1622.0, 636.0, 323.0, 168.0, 95.0, 58.0, 31.0, 33.0, 18.0, 11.0, 12.0, 5.0, 3.0, 9.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.51953125, -16.0078125, -15.49609375, -14.984375, -14.47265625, -13.9609375, -13.44921875, -12.9375, -12.42578125, -11.9140625, -11.40234375, -10.890625, -10.37890625, -9.8671875, -9.35546875, -8.84375, -8.33203125, -7.8203125, -7.30859375, -6.796875, -6.28515625, -5.7734375, -5.26171875, -4.75, -4.23828125, -3.7265625, -3.21484375, -2.703125, -2.19140625, -1.6796875, -1.16796875, -0.65625, -0.14453125, 0.3671875, 0.87890625, 1.390625, 1.90234375, 2.4140625, 2.92578125, 3.4375, 3.94921875, 4.4609375, 4.97265625, 5.484375, 5.99609375, 6.5078125, 7.01953125, 7.53125, 8.04296875, 8.5546875, 9.06640625, 9.578125, 10.08984375, 10.6015625, 11.11328125, 11.625, 12.13671875, 12.6484375, 13.16015625, 13.671875, 14.18359375, 14.6953125, 15.20703125, 15.71875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 5.0, 14.0, 20.0, 28.0, 22.0, 36.0, 54.0, 66.0, 77.0, 100.0, 153.0, 152.0, 200.0, 285.0, 361.0, 343.0, 401.0, 333.0, 301.0, 244.0, 201.0, 165.0, 125.0, 88.0, 65.0, 49.0, 48.0, 30.0, 20.0, 11.0, 11.0, 15.0, 11.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.109375, -16.6241455078125, -16.138916015625, -15.6536865234375, -15.16845703125, -14.6832275390625, -14.197998046875, -13.7127685546875, -13.2275390625, -12.7423095703125, -12.257080078125, -11.7718505859375, -11.28662109375, -10.8013916015625, -10.316162109375, -9.8309326171875, -9.345703125, -8.8604736328125, -8.375244140625, -7.8900146484375, -7.40478515625, -6.9195556640625, -6.434326171875, -5.9490966796875, -5.4638671875, -4.9786376953125, -4.493408203125, -4.0081787109375, -3.52294921875, -3.0377197265625, -2.552490234375, -2.0672607421875, -1.58203125, -1.0968017578125, -0.611572265625, -0.1263427734375, 0.35888671875, 0.8441162109375, 1.329345703125, 1.8145751953125, 2.2998046875, 2.7850341796875, 3.270263671875, 3.7554931640625, 4.24072265625, 4.7259521484375, 5.211181640625, 5.6964111328125, 6.181640625, 6.6668701171875, 7.152099609375, 7.6373291015625, 8.12255859375, 8.6077880859375, 9.093017578125, 9.5782470703125, 10.0634765625, 10.5487060546875, 11.033935546875, 11.5191650390625, 12.00439453125, 12.4896240234375, 12.974853515625, 13.4600830078125, 13.9453125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 7.0, 20.0, 22.0, 36.0, 37.0, 83.0, 109.0, 262.0, 563.0, 1232.0, 3581.0, 14071.0, 74097.0, 576076.0, 2846242.0, 582781.0, 74792.0, 14167.0, 3711.0, 1227.0, 490.0, 258.0, 136.0, 76.0, 60.0, 36.0, 26.0, 18.0, 9.0, 9.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.25, -22.216796875, -21.18359375, -20.150390625, -19.1171875, -18.083984375, -17.05078125, -16.017578125, -14.984375, -13.951171875, -12.91796875, -11.884765625, -10.8515625, -9.818359375, -8.78515625, -7.751953125, -6.71875, -5.685546875, -4.65234375, -3.619140625, -2.5859375, -1.552734375, -0.51953125, 0.513671875, 1.546875, 2.580078125, 3.61328125, 4.646484375, 5.6796875, 6.712890625, 7.74609375, 8.779296875, 9.8125, 10.845703125, 11.87890625, 12.912109375, 13.9453125, 14.978515625, 16.01171875, 17.044921875, 18.078125, 19.111328125, 20.14453125, 21.177734375, 22.2109375, 23.244140625, 24.27734375, 25.310546875, 26.34375, 27.376953125, 28.41015625, 29.443359375, 30.4765625, 31.509765625, 32.54296875, 33.576171875, 34.609375, 35.642578125, 36.67578125, 37.708984375, 38.7421875, 39.775390625, 40.80859375, 41.841796875, 42.875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 14.0, 28.0, 48.0, 82.0, 122.0, 130.0, 160.0, 119.0, 119.0, 89.0, 38.0, 23.0, 11.0, 11.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.89315795898438, -83.9896011352539, -80.08605194091797, -76.1824951171875, -72.27893829345703, -68.37538146972656, -64.47183227539062, -60.568275451660156, -56.66472244262695, -52.76116943359375, -48.85761260986328, -44.95405960083008, -41.050506591796875, -37.146949768066406, -33.2433967590332, -29.339841842651367, -25.43628692626953, -21.532732009887695, -17.62917709350586, -13.725624084472656, -9.82206916809082, -5.918514251708984, -2.0149612426757812, 1.8885936737060547, 5.792148590087891, 9.695703506469727, 13.599257469177246, 17.502811431884766, 21.4063663482666, 25.309921264648438, 29.21347427368164, 33.117027282714844, 37.02058410644531, 40.924137115478516, 44.827693939208984, 48.73124694824219, 52.634803771972656, 56.53835678100586, 60.44190979003906, 64.34546661376953, 68.2490234375, 72.15258026123047, 76.0561294555664, 79.95968627929688, 83.86324310302734, 87.76679992675781, 91.67034912109375, 95.57390594482422, 99.47745513916016, 103.38101196289062, 107.28456115722656, 111.18811798095703, 115.0916748046875, 118.99522399902344, 122.8987808227539, 126.80233764648438, 130.7058868408203, 134.60943603515625, 138.51300048828125, 142.4165496826172, 146.32009887695312, 150.22366333007812, 154.12721252441406, 158.03076171875, 161.934326171875]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 10.0, 13.0, 11.0, 15.0, 15.0, 16.0, 12.0, 15.0, 29.0, 21.0, 28.0, 26.0, 32.0, 38.0, 36.0, 33.0, 30.0, 31.0, 30.0, 47.0, 41.0, 48.0, 38.0, 28.0, 27.0, 29.0, 31.0, 30.0, 28.0, 18.0, 27.0, 28.0, 15.0, 13.0, 11.0, 18.0, 17.0, 7.0, 10.0, 5.0, 6.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-54.07867431640625, -52.431583404541016, -50.78449249267578, -49.13740158081055, -47.49031066894531, -45.84321594238281, -44.19612503051758, -42.549034118652344, -40.90194320678711, -39.254852294921875, -37.60776138305664, -35.960670471191406, -34.313575744628906, -32.66648864746094, -31.019393920898438, -29.372303009033203, -27.72521209716797, -26.078121185302734, -24.4310302734375, -22.783937454223633, -21.1368465423584, -19.489755630493164, -17.842662811279297, -16.195571899414062, -14.548480987548828, -12.901390075683594, -11.254298210144043, -9.607206344604492, -7.960115432739258, -6.313024520874023, -4.665932655334473, -3.018840789794922, -1.3717498779296875, 0.2753415107727051, 1.9224328994750977, 3.5695242881774902, 5.216615676879883, 6.863706588745117, 8.510798454284668, 10.157890319824219, 11.804981231689453, 13.452072143554688, 15.099164009094238, 16.74625587463379, 18.393346786499023, 20.040437698364258, 21.687530517578125, 23.33462142944336, 24.981712341308594, 26.628803253173828, 28.275894165039062, 29.92298698425293, 31.570077896118164, 33.21717071533203, 34.864261627197266, 36.5113525390625, 38.158443450927734, 39.80553436279297, 41.4526252746582, 43.09971618652344, 44.74681091308594, 46.393898010253906, 48.040992736816406, 49.68808364868164, 51.335174560546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 4.0, 4.0, 4.0, 10.0, 8.0, 6.0, 16.0, 15.0, 14.0, 14.0, 23.0, 23.0, 34.0, 36.0, 34.0, 37.0, 26.0, 39.0, 45.0, 46.0, 37.0, 44.0, 43.0, 34.0, 51.0, 37.0, 39.0, 33.0, 26.0, 30.0, 29.0, 24.0, 21.0, 18.0, 13.0, 11.0, 6.0, 10.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.35546875, -7.13275146484375, -6.9100341796875, -6.68731689453125, -6.464599609375, -6.24188232421875, -6.0191650390625, -5.79644775390625, -5.57373046875, -5.35101318359375, -5.1282958984375, -4.90557861328125, -4.682861328125, -4.46014404296875, -4.2374267578125, -4.01470947265625, -3.7919921875, -3.56927490234375, -3.3465576171875, -3.12384033203125, -2.901123046875, -2.67840576171875, -2.4556884765625, -2.23297119140625, -2.01025390625, -1.78753662109375, -1.5648193359375, -1.34210205078125, -1.119384765625, -0.89666748046875, -0.6739501953125, -0.45123291015625, -0.228515625, -0.00579833984375, 0.2169189453125, 0.43963623046875, 0.662353515625, 0.88507080078125, 1.1077880859375, 1.33050537109375, 1.55322265625, 1.77593994140625, 1.9986572265625, 2.22137451171875, 2.444091796875, 2.66680908203125, 2.8895263671875, 3.11224365234375, 3.3349609375, 3.55767822265625, 3.7803955078125, 4.00311279296875, 4.225830078125, 4.44854736328125, 4.6712646484375, 4.89398193359375, 5.11669921875, 5.33941650390625, 5.5621337890625, 5.78485107421875, 6.007568359375, 6.23028564453125, 6.4530029296875, 6.67572021484375, 6.8984375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 11.0, 14.0, 14.0, 24.0, 47.0, 42.0, 75.0, 89.0, 152.0, 228.0, 328.0, 504.0, 734.0, 1073.0, 1530.0, 2178.0, 3389.0, 4977.0, 7556.0, 11238.0, 16924.0, 25896.0, 39683.0, 59701.0, 89308.0, 125731.0, 159288.0, 150508.0, 113988.0, 78668.0, 52652.0, 34570.0, 22522.0, 14874.0, 9817.0, 6563.0, 4363.0, 2942.0, 2013.0, 1363.0, 993.0, 612.0, 437.0, 292.0, 210.0, 137.0, 108.0, 56.0, 56.0, 22.0, 23.0, 15.0, 11.0, 5.0, 7.0, 5.0, 0.0, 2.0], "bins": [-0.51513671875, -0.49945068359375, -0.4837646484375, -0.46807861328125, -0.452392578125, -0.43670654296875, -0.4210205078125, -0.40533447265625, -0.3896484375, -0.37396240234375, -0.3582763671875, -0.34259033203125, -0.326904296875, -0.31121826171875, -0.2955322265625, -0.27984619140625, -0.26416015625, -0.24847412109375, -0.2327880859375, -0.21710205078125, -0.201416015625, -0.18572998046875, -0.1700439453125, -0.15435791015625, -0.138671875, -0.12298583984375, -0.1072998046875, -0.09161376953125, -0.075927734375, -0.06024169921875, -0.0445556640625, -0.02886962890625, -0.01318359375, 0.00250244140625, 0.0181884765625, 0.03387451171875, 0.049560546875, 0.06524658203125, 0.0809326171875, 0.09661865234375, 0.1123046875, 0.12799072265625, 0.1436767578125, 0.15936279296875, 0.175048828125, 0.19073486328125, 0.2064208984375, 0.22210693359375, 0.23779296875, 0.25347900390625, 0.2691650390625, 0.28485107421875, 0.300537109375, 0.31622314453125, 0.3319091796875, 0.34759521484375, 0.36328125, 0.37896728515625, 0.3946533203125, 0.41033935546875, 0.426025390625, 0.44171142578125, 0.4573974609375, 0.47308349609375, 0.48876953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 13.0, 4.0, 10.0, 15.0, 15.0, 22.0, 14.0, 13.0, 22.0, 19.0, 29.0, 28.0, 26.0, 31.0, 38.0, 30.0, 38.0, 35.0, 24.0, 34.0, 1077.0, 43.0, 45.0, 39.0, 42.0, 28.0, 33.0, 29.0, 27.0, 15.0, 20.0, 14.0, 18.0, 23.0, 15.0, 22.0, 11.0, 10.0, 14.0, 10.0, 9.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9921875, -3.85650634765625, -3.7208251953125, -3.58514404296875, -3.449462890625, -3.31378173828125, -3.1781005859375, -3.04241943359375, -2.90673828125, -2.77105712890625, -2.6353759765625, -2.49969482421875, -2.364013671875, -2.22833251953125, -2.0926513671875, -1.95697021484375, -1.8212890625, -1.68560791015625, -1.5499267578125, -1.41424560546875, -1.278564453125, -1.14288330078125, -1.0072021484375, -0.87152099609375, -0.73583984375, -0.60015869140625, -0.4644775390625, -0.32879638671875, -0.193115234375, -0.05743408203125, 0.0782470703125, 0.21392822265625, 0.349609375, 0.48529052734375, 0.6209716796875, 0.75665283203125, 0.892333984375, 1.02801513671875, 1.1636962890625, 1.29937744140625, 1.43505859375, 1.57073974609375, 1.7064208984375, 1.84210205078125, 1.977783203125, 2.11346435546875, 2.2491455078125, 2.38482666015625, 2.5205078125, 2.65618896484375, 2.7918701171875, 2.92755126953125, 3.063232421875, 3.19891357421875, 3.3345947265625, 3.47027587890625, 3.60595703125, 3.74163818359375, 3.8773193359375, 4.01300048828125, 4.148681640625, 4.28436279296875, 4.4200439453125, 4.55572509765625, 4.69140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 29.0, 37.0, 48.0, 102.0, 149.0, 189.0, 299.0, 471.0, 730.0, 1200.0, 1955.0, 3039.0, 4810.0, 7704.0, 12317.0, 19660.0, 31202.0, 49694.0, 75387.0, 108689.0, 151303.0, 1192186.0, 139257.0, 102477.0, 70776.0, 45867.0, 28897.0, 18265.0, 11308.0, 7164.0, 4357.0, 2693.0, 1776.0, 1088.0, 739.0, 445.0, 286.0, 186.0, 102.0, 63.0, 50.0, 36.0, 19.0, 21.0, 18.0, 11.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.38671875, -0.37514495849609375, -0.3635711669921875, -0.35199737548828125, -0.340423583984375, -0.32884979248046875, -0.3172760009765625, -0.30570220947265625, -0.29412841796875, -0.28255462646484375, -0.2709808349609375, -0.25940704345703125, -0.247833251953125, -0.23625946044921875, -0.2246856689453125, -0.21311187744140625, -0.2015380859375, -0.18996429443359375, -0.1783905029296875, -0.16681671142578125, -0.155242919921875, -0.14366912841796875, -0.1320953369140625, -0.12052154541015625, -0.10894775390625, -0.09737396240234375, -0.0858001708984375, -0.07422637939453125, -0.062652587890625, -0.05107879638671875, -0.0395050048828125, -0.02793121337890625, -0.016357421875, -0.00478363037109375, 0.0067901611328125, 0.01836395263671875, 0.029937744140625, 0.04151153564453125, 0.0530853271484375, 0.06465911865234375, 0.07623291015625, 0.08780670166015625, 0.0993804931640625, 0.11095428466796875, 0.122528076171875, 0.13410186767578125, 0.1456756591796875, 0.15724945068359375, 0.1688232421875, 0.18039703369140625, 0.1919708251953125, 0.20354461669921875, 0.215118408203125, 0.22669219970703125, 0.2382659912109375, 0.24983978271484375, 0.26141357421875, 0.27298736572265625, 0.2845611572265625, 0.29613494873046875, 0.307708740234375, 0.31928253173828125, 0.3308563232421875, 0.34243011474609375, 0.35400390625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 6.0, 6.0, 6.0, 7.0, 6.0, 2.0, 15.0, 15.0, 14.0, 14.0, 12.0, 31.0, 23.0, 30.0, 51.0, 62.0, 66.0, 71.0, 60.0, 68.0, 74.0, 56.0, 44.0, 43.0, 39.0, 34.0, 20.0, 23.0, 17.0, 18.0, 5.0, 12.0, 13.0, 10.0, 2.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00901031494140625, -0.00873422622680664, -0.008458137512207031, -0.008182048797607422, -0.007905960083007812, -0.007629871368408203, -0.007353782653808594, -0.007077693939208984, -0.006801605224609375, -0.006525516510009766, -0.006249427795410156, -0.005973339080810547, -0.0056972503662109375, -0.005421161651611328, -0.005145072937011719, -0.004868984222412109, -0.0045928955078125, -0.004316806793212891, -0.004040718078613281, -0.003764629364013672, -0.0034885406494140625, -0.003212451934814453, -0.0029363632202148438, -0.0026602745056152344, -0.002384185791015625, -0.0021080970764160156, -0.0018320083618164062, -0.0015559196472167969, -0.0012798309326171875, -0.0010037422180175781, -0.0007276535034179688, -0.0004515647888183594, -0.00017547607421875, 0.00010061264038085938, 0.00037670135498046875, 0.0006527900695800781, 0.0009288787841796875, 0.0012049674987792969, 0.0014810562133789062, 0.0017571449279785156, 0.002033233642578125, 0.0023093223571777344, 0.0025854110717773438, 0.002861499786376953, 0.0031375885009765625, 0.003413677215576172, 0.0036897659301757812, 0.003965854644775391, 0.004241943359375, 0.004518032073974609, 0.004794120788574219, 0.005070209503173828, 0.0053462982177734375, 0.005622386932373047, 0.005898475646972656, 0.006174564361572266, 0.006450653076171875, 0.006726741790771484, 0.007002830505371094, 0.007278919219970703, 0.0075550079345703125, 0.007831096649169922, 0.008107185363769531, 0.00838327407836914, 0.00865936279296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 2.0, 3.0, 3.0, 7.0, 10.0, 22.0, 13.0, 19.0, 30.0, 38.0, 45.0, 53.0, 79.0, 93.0, 141.0, 193.0, 338.0, 744.0, 9317.0, 907760.0, 125970.0, 2273.0, 482.0, 232.0, 187.0, 122.0, 81.0, 56.0, 49.0, 37.0, 35.0, 25.0, 16.0, 10.0, 11.0, 12.0, 9.0, 7.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.1536865234375, -0.14899826049804688, -0.14430999755859375, -0.13962173461914062, -0.1349334716796875, -0.13024520874023438, -0.12555694580078125, -0.12086868286132812, -0.116180419921875, -0.11149215698242188, -0.10680389404296875, -0.10211563110351562, -0.0974273681640625, -0.09273910522460938, -0.08805084228515625, -0.08336257934570312, -0.07867431640625, -0.07398605346679688, -0.06929779052734375, -0.06460952758789062, -0.0599212646484375, -0.055233001708984375, -0.05054473876953125, -0.045856475830078125, -0.041168212890625, -0.036479949951171875, -0.03179168701171875, -0.027103424072265625, -0.0224151611328125, -0.017726898193359375, -0.01303863525390625, -0.008350372314453125, -0.003662109375, 0.001026153564453125, 0.00571441650390625, 0.010402679443359375, 0.0150909423828125, 0.019779205322265625, 0.02446746826171875, 0.029155731201171875, 0.033843994140625, 0.038532257080078125, 0.04322052001953125, 0.047908782958984375, 0.0525970458984375, 0.057285308837890625, 0.06197357177734375, 0.06666183471679688, 0.07135009765625, 0.07603836059570312, 0.08072662353515625, 0.08541488647460938, 0.0901031494140625, 0.09479141235351562, 0.09947967529296875, 0.10416793823242188, 0.108856201171875, 0.11354446411132812, 0.11823272705078125, 0.12292098999023438, 0.1276092529296875, 0.13229751586914062, 0.13698577880859375, 0.14167404174804688, 0.1463623046875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 108.0, 633.0, 264.0, 9.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05860211327672005, -0.05719451233744621, -0.05578691512346268, -0.05437931418418884, -0.05297171697020531, -0.05156411603093147, -0.05015651881694794, -0.0487489178776741, -0.04734132066369057, -0.04593371972441673, -0.0445261225104332, -0.04311852157115936, -0.04171092435717583, -0.04030332341790199, -0.03889572620391846, -0.03748812526464462, -0.03608052432537079, -0.034672923386096954, -0.03326532617211342, -0.031857725232839584, -0.03045012801885605, -0.029042528942227364, -0.02763492986559868, -0.026227328926324844, -0.02481973171234131, -0.023412132635712624, -0.02200453355908394, -0.020596934482455254, -0.01918933540582657, -0.017781736329197884, -0.0163741372525692, -0.014966537244617939, -0.013558939099311829, -0.012151340022683144, -0.010743740946054459, -0.009336141869425774, -0.007928542792797089, -0.006520943250507116, -0.005113343708217144, -0.003705744631588459, -0.002298145554959774, -0.0008905463619157672, 0.0005170528311282396, 0.0019246521405875683, 0.0033322512172162533, 0.004739850293844938, 0.006147449836134911, 0.007555048912763596, 0.00896264798939228, 0.010370247066020966, 0.01177784614264965, 0.013185445219278336, 0.01459304429590702, 0.016000643372535706, 0.01740824431180954, 0.018815841525793076, 0.02022344246506691, 0.021631041541695595, 0.02303864061832428, 0.024446239694952965, 0.02585383877158165, 0.027261437848210335, 0.02866903692483902, 0.030076637864112854, 0.03148423507809639]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 7.0, 7.0, 6.0, 15.0, 14.0, 14.0, 17.0, 14.0, 19.0, 21.0, 32.0, 26.0, 28.0, 32.0, 31.0, 28.0, 36.0, 44.0, 38.0, 42.0, 49.0, 33.0, 36.0, 52.0, 39.0, 34.0, 33.0, 30.0, 17.0, 26.0, 20.0, 28.0, 13.0, 22.0, 17.0, 16.0, 14.0, 10.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.004636287689208984, -0.004491076804697514, -0.004345865920186043, -0.004200655035674572, -0.004055444151163101, -0.00391023326665163, -0.0037650223821401596, -0.003619811497628689, -0.003474600613117218, -0.0033293897286057472, -0.0031841788440942764, -0.0030389679595828056, -0.002893757075071335, -0.002748546190559864, -0.0026033353060483932, -0.0024581244215369225, -0.0023129135370254517, -0.002167702652513981, -0.00202249176800251, -0.0018772808834910393, -0.0017320699989795685, -0.0015868591144680977, -0.001441648229956627, -0.001296437345445156, -0.0011512264609336853, -0.0010060155764222145, -0.0008608046919107437, -0.0007155938073992729, -0.0005703829228878021, -0.00042517203837633133, -0.00027996115386486053, -0.00013475026935338974, 1.0460615158081055e-05, 0.00015567149966955185, 0.00030088238418102264, 0.00044609326869249344, 0.0005913041532039642, 0.000736515037715435, 0.0008817259222269058, 0.0010269368067383766, 0.0011721476912498474, 0.0013173585757613182, 0.001462569460272789, 0.0016077803447842598, 0.0017529912292957306, 0.0018982021138072014, 0.002043412998318672, 0.002188623882830143, 0.0023338347673416138, 0.0024790456518530846, 0.0026242565363645554, 0.002769467420876026, 0.002914678305387497, 0.0030598891898989677, 0.0032051000744104385, 0.0033503109589219093, 0.00349552184343338, 0.003640732727944851, 0.0037859436124563217, 0.0039311544969677925, 0.004076365381479263, 0.004221576265990734, 0.004366787150502205, 0.004511998035013676, 0.0046572089195251465]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 4.0, 4.0, 4.0, 10.0, 8.0, 6.0, 16.0, 15.0, 14.0, 14.0, 23.0, 23.0, 34.0, 36.0, 34.0, 37.0, 25.0, 40.0, 45.0, 46.0, 37.0, 44.0, 43.0, 34.0, 51.0, 37.0, 39.0, 33.0, 26.0, 30.0, 29.0, 24.0, 21.0, 18.0, 13.0, 11.0, 6.0, 10.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.35546875, -7.13275146484375, -6.9100341796875, -6.68731689453125, -6.464599609375, -6.24188232421875, -6.0191650390625, -5.79644775390625, -5.57373046875, -5.35101318359375, -5.1282958984375, -4.90557861328125, -4.682861328125, -4.46014404296875, -4.2374267578125, -4.01470947265625, -3.7919921875, -3.56927490234375, -3.3465576171875, -3.12384033203125, -2.901123046875, -2.67840576171875, -2.4556884765625, -2.23297119140625, -2.01025390625, -1.78753662109375, -1.5648193359375, -1.34210205078125, -1.119384765625, -0.89666748046875, -0.6739501953125, -0.45123291015625, -0.228515625, -0.00579833984375, 0.2169189453125, 0.43963623046875, 0.662353515625, 0.88507080078125, 1.1077880859375, 1.33050537109375, 1.55322265625, 1.77593994140625, 1.9986572265625, 2.22137451171875, 2.444091796875, 2.66680908203125, 2.8895263671875, 3.11224365234375, 3.3349609375, 3.55767822265625, 3.7803955078125, 4.00311279296875, 4.225830078125, 4.44854736328125, 4.6712646484375, 4.89398193359375, 5.11669921875, 5.33941650390625, 5.5621337890625, 5.78485107421875, 6.007568359375, 6.23028564453125, 6.4530029296875, 6.67572021484375, 6.8984375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 12.0, 5.0, 13.0, 15.0, 18.0, 35.0, 45.0, 83.0, 121.0, 203.0, 353.0, 638.0, 1017.0, 1738.0, 3031.0, 5467.0, 10320.0, 20907.0, 48918.0, 134121.0, 357145.0, 286598.0, 101926.0, 38505.0, 17507.0, 8833.0, 4644.0, 2648.0, 1448.0, 873.0, 525.0, 307.0, 175.0, 116.0, 70.0, 50.0, 22.0, 30.0, 14.0, 7.0, 7.0, 6.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.296875, -4.16204833984375, -4.0272216796875, -3.89239501953125, -3.757568359375, -3.62274169921875, -3.4879150390625, -3.35308837890625, -3.21826171875, -3.08343505859375, -2.9486083984375, -2.81378173828125, -2.678955078125, -2.54412841796875, -2.4093017578125, -2.27447509765625, -2.1396484375, -2.00482177734375, -1.8699951171875, -1.73516845703125, -1.600341796875, -1.46551513671875, -1.3306884765625, -1.19586181640625, -1.06103515625, -0.92620849609375, -0.7913818359375, -0.65655517578125, -0.521728515625, -0.38690185546875, -0.2520751953125, -0.11724853515625, 0.017578125, 0.15240478515625, 0.2872314453125, 0.42205810546875, 0.556884765625, 0.69171142578125, 0.8265380859375, 0.96136474609375, 1.09619140625, 1.23101806640625, 1.3658447265625, 1.50067138671875, 1.635498046875, 1.77032470703125, 1.9051513671875, 2.03997802734375, 2.1748046875, 2.30963134765625, 2.4444580078125, 2.57928466796875, 2.714111328125, 2.84893798828125, 2.9837646484375, 3.11859130859375, 3.25341796875, 3.38824462890625, 3.5230712890625, 3.65789794921875, 3.792724609375, 3.92755126953125, 4.0623779296875, 4.19720458984375, 4.33203125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 6.0, 5.0, 10.0, 10.0, 20.0, 19.0, 25.0, 29.0, 31.0, 33.0, 37.0, 31.0, 44.0, 55.0, 65.0, 141.0, 1741.0, 251.0, 80.0, 61.0, 51.0, 44.0, 34.0, 28.0, 36.0, 24.0, 25.0, 20.0, 17.0, 13.0, 14.0, 12.0, 7.0, 10.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.5, -26.573486328125, -25.64697265625, -24.720458984375, -23.7939453125, -22.867431640625, -21.94091796875, -21.014404296875, -20.087890625, -19.161376953125, -18.23486328125, -17.308349609375, -16.3818359375, -15.455322265625, -14.52880859375, -13.602294921875, -12.67578125, -11.749267578125, -10.82275390625, -9.896240234375, -8.9697265625, -8.043212890625, -7.11669921875, -6.190185546875, -5.263671875, -4.337158203125, -3.41064453125, -2.484130859375, -1.5576171875, -0.631103515625, 0.29541015625, 1.221923828125, 2.1484375, 3.074951171875, 4.00146484375, 4.927978515625, 5.8544921875, 6.781005859375, 7.70751953125, 8.634033203125, 9.560546875, 10.487060546875, 11.41357421875, 12.340087890625, 13.2666015625, 14.193115234375, 15.11962890625, 16.046142578125, 16.97265625, 17.899169921875, 18.82568359375, 19.752197265625, 20.6787109375, 21.605224609375, 22.53173828125, 23.458251953125, 24.384765625, 25.311279296875, 26.23779296875, 27.164306640625, 28.0908203125, 29.017333984375, 29.94384765625, 30.870361328125, 31.796875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 6.0, 10.0, 6.0, 19.0, 13.0, 8.0, 21.0, 27.0, 33.0, 30.0, 46.0, 55.0, 112.0, 151.0, 273.0, 494.0, 1806.0, 96282.0, 3036736.0, 7757.0, 830.0, 359.0, 188.0, 105.0, 77.0, 66.0, 45.0, 40.0, 28.0, 16.0, 17.0, 11.0, 8.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.90625, -50.39111328125, -48.8759765625, -47.36083984375, -45.845703125, -44.33056640625, -42.8154296875, -41.30029296875, -39.78515625, -38.27001953125, -36.7548828125, -35.23974609375, -33.724609375, -32.20947265625, -30.6943359375, -29.17919921875, -27.6640625, -26.14892578125, -24.6337890625, -23.11865234375, -21.603515625, -20.08837890625, -18.5732421875, -17.05810546875, -15.54296875, -14.02783203125, -12.5126953125, -10.99755859375, -9.482421875, -7.96728515625, -6.4521484375, -4.93701171875, -3.421875, -1.90673828125, -0.3916015625, 1.12353515625, 2.638671875, 4.15380859375, 5.6689453125, 7.18408203125, 8.69921875, 10.21435546875, 11.7294921875, 13.24462890625, 14.759765625, 16.27490234375, 17.7900390625, 19.30517578125, 20.8203125, 22.33544921875, 23.8505859375, 25.36572265625, 26.880859375, 28.39599609375, 29.9111328125, 31.42626953125, 32.94140625, 34.45654296875, 35.9716796875, 37.48681640625, 39.001953125, 40.51708984375, 42.0322265625, 43.54736328125, 45.0625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 68.0, 253.0, 427.0, 203.0, 48.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.062313079833984, -42.47664260864258, -39.89097595214844, -37.30530548095703, -34.71963882446289, -32.133968353271484, -29.54829978942871, -26.962631225585938, -24.376962661743164, -21.79129409790039, -19.205625534057617, -16.619956970214844, -14.034287452697754, -11.44861888885498, -8.86294937133789, -6.277280807495117, -3.6916122436523438, -1.1059434413909912, 1.4797253608703613, 4.065394401550293, 6.651062965393066, 9.23673152923584, 11.82240104675293, 14.408069610595703, 16.993738174438477, 19.57940673828125, 22.165075302124023, 24.750743865966797, 27.336414337158203, 29.922080993652344, 32.50775146484375, 35.093421936035156, 37.67909240722656, 40.26476287841797, 42.85042953491211, 45.436100006103516, 48.021766662597656, 50.60743713378906, 53.19310760498047, 55.77877426147461, 58.36444091796875, 60.950111389160156, 63.5357780456543, 66.12144470214844, 68.70711517333984, 71.29278564453125, 73.87845611572266, 76.46412658691406, 79.04978942871094, 81.63545989990234, 84.22113037109375, 86.80679321289062, 89.39246368408203, 91.97813415527344, 94.56380462646484, 97.14947509765625, 99.73514556884766, 102.32081604003906, 104.90648651123047, 107.49214935302734, 110.07781982421875, 112.66349029541016, 115.24916076660156, 117.83482360839844, 120.42049407958984]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 11.0, 20.0, 20.0, 22.0, 16.0, 29.0, 27.0, 38.0, 31.0, 29.0, 64.0, 38.0, 38.0, 55.0, 51.0, 54.0, 49.0, 41.0, 36.0, 36.0, 45.0, 35.0, 30.0, 20.0, 25.0, 22.0, 13.0, 12.0, 12.0, 14.0, 12.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-82.09048461914062, -79.2146987915039, -76.33891296386719, -73.46312713623047, -70.58734130859375, -67.71156311035156, -64.83577728271484, -61.959991455078125, -59.084205627441406, -56.20841979980469, -53.33263397216797, -50.456851959228516, -47.5810661315918, -44.70528030395508, -41.829498291015625, -38.953712463378906, -36.07792663574219, -33.20214080810547, -30.326356887817383, -27.450572967529297, -24.574787139892578, -21.69900131225586, -18.823217391967773, -15.947433471679688, -13.071647644042969, -10.195862770080566, -7.320077896118164, -4.444293022155762, -1.5685081481933594, 1.307276725769043, 4.183061599731445, 7.058845520019531, 9.934623718261719, 12.810408592224121, 15.686193466186523, 18.56197738647461, 21.437763214111328, 24.313549041748047, 27.189332962036133, 30.06511688232422, 32.94090270996094, 35.816688537597656, 38.692474365234375, 41.56825637817383, 44.44404220581055, 47.319828033447266, 50.19561004638672, 53.07139587402344, 55.947181701660156, 58.822967529296875, 61.698753356933594, 64.57453918457031, 67.4503173828125, 70.32610321044922, 73.20188903808594, 76.07767486572266, 78.95346069335938, 81.8292465209961, 84.70503234863281, 87.58081817626953, 90.45660400390625, 93.33238220214844, 96.20816802978516, 99.08395385742188, 101.9597396850586]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 6.0, 4.0, 6.0, 6.0, 4.0, 5.0, 5.0, 7.0, 10.0, 13.0, 13.0, 11.0, 12.0, 25.0, 24.0, 25.0, 33.0, 30.0, 35.0, 34.0, 40.0, 34.0, 42.0, 41.0, 39.0, 41.0, 35.0, 38.0, 36.0, 47.0, 42.0, 27.0, 29.0, 32.0, 25.0, 18.0, 18.0, 23.0, 12.0, 16.0, 7.0, 10.0, 7.0, 8.0, 8.0, 8.0, 3.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-7.2109375, -6.99176025390625, -6.7725830078125, -6.55340576171875, -6.334228515625, -6.11505126953125, -5.8958740234375, -5.67669677734375, -5.45751953125, -5.23834228515625, -5.0191650390625, -4.79998779296875, -4.580810546875, -4.36163330078125, -4.1424560546875, -3.92327880859375, -3.7041015625, -3.48492431640625, -3.2657470703125, -3.04656982421875, -2.827392578125, -2.60821533203125, -2.3890380859375, -2.16986083984375, -1.95068359375, -1.73150634765625, -1.5123291015625, -1.29315185546875, -1.073974609375, -0.85479736328125, -0.6356201171875, -0.41644287109375, -0.197265625, 0.02191162109375, 0.2410888671875, 0.46026611328125, 0.679443359375, 0.89862060546875, 1.1177978515625, 1.33697509765625, 1.55615234375, 1.77532958984375, 1.9945068359375, 2.21368408203125, 2.432861328125, 2.65203857421875, 2.8712158203125, 3.09039306640625, 3.3095703125, 3.52874755859375, 3.7479248046875, 3.96710205078125, 4.186279296875, 4.40545654296875, 4.6246337890625, 4.84381103515625, 5.06298828125, 5.28216552734375, 5.5013427734375, 5.72052001953125, 5.939697265625, 6.15887451171875, 6.3780517578125, 6.59722900390625, 6.81640625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 7.0, 4.0, 8.0, 13.0, 6.0, 9.0, 8.0, 12.0, 16.0, 27.0, 32.0, 53.0, 78.0, 130.0, 243.0, 583.0, 1586.0, 4998.0, 21585.0, 129150.0, 1343797.0, 2359294.0, 282260.0, 38364.0, 8085.0, 2245.0, 827.0, 357.0, 169.0, 95.0, 48.0, 34.0, 36.0, 22.0, 14.0, 21.0, 9.0, 15.0, 9.0, 5.0, 5.0, 6.0, 3.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.15625, -19.52978515625, -18.9033203125, -18.27685546875, -17.650390625, -17.02392578125, -16.3974609375, -15.77099609375, -15.14453125, -14.51806640625, -13.8916015625, -13.26513671875, -12.638671875, -12.01220703125, -11.3857421875, -10.75927734375, -10.1328125, -9.50634765625, -8.8798828125, -8.25341796875, -7.626953125, -7.00048828125, -6.3740234375, -5.74755859375, -5.12109375, -4.49462890625, -3.8681640625, -3.24169921875, -2.615234375, -1.98876953125, -1.3623046875, -0.73583984375, -0.109375, 0.51708984375, 1.1435546875, 1.77001953125, 2.396484375, 3.02294921875, 3.6494140625, 4.27587890625, 4.90234375, 5.52880859375, 6.1552734375, 6.78173828125, 7.408203125, 8.03466796875, 8.6611328125, 9.28759765625, 9.9140625, 10.54052734375, 11.1669921875, 11.79345703125, 12.419921875, 13.04638671875, 13.6728515625, 14.29931640625, 14.92578125, 15.55224609375, 16.1787109375, 16.80517578125, 17.431640625, 18.05810546875, 18.6845703125, 19.31103515625, 19.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 8.0, 3.0, 2.0, 7.0, 5.0, 3.0, 10.0, 14.0, 21.0, 22.0, 41.0, 52.0, 88.0, 89.0, 146.0, 184.0, 289.0, 376.0, 433.0, 495.0, 453.0, 353.0, 279.0, 219.0, 143.0, 98.0, 79.0, 49.0, 44.0, 20.0, 16.0, 16.0, 14.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.1688232421875, -13.564208984375, -12.9595947265625, -12.35498046875, -11.7503662109375, -11.145751953125, -10.5411376953125, -9.9365234375, -9.3319091796875, -8.727294921875, -8.1226806640625, -7.51806640625, -6.9134521484375, -6.308837890625, -5.7042236328125, -5.099609375, -4.4949951171875, -3.890380859375, -3.2857666015625, -2.68115234375, -2.0765380859375, -1.471923828125, -0.8673095703125, -0.2626953125, 0.3419189453125, 0.946533203125, 1.5511474609375, 2.15576171875, 2.7603759765625, 3.364990234375, 3.9696044921875, 4.57421875, 5.1788330078125, 5.783447265625, 6.3880615234375, 6.99267578125, 7.5972900390625, 8.201904296875, 8.8065185546875, 9.4111328125, 10.0157470703125, 10.620361328125, 11.2249755859375, 11.82958984375, 12.4342041015625, 13.038818359375, 13.6434326171875, 14.248046875, 14.8526611328125, 15.457275390625, 16.0618896484375, 16.66650390625, 17.2711181640625, 17.875732421875, 18.4803466796875, 19.0849609375, 19.6895751953125, 20.294189453125, 20.8988037109375, 21.50341796875, 22.1080322265625, 22.712646484375, 23.3172607421875, 23.921875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 7.0, 19.0, 30.0, 38.0, 44.0, 100.0, 116.0, 179.0, 351.0, 777.0, 2198.0, 8830.0, 51461.0, 435118.0, 2871416.0, 728128.0, 78305.0, 12385.0, 2817.0, 906.0, 388.0, 229.0, 132.0, 87.0, 70.0, 32.0, 28.0, 23.0, 15.0, 17.0, 9.0, 7.0, 8.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.52880859375, -30.4638671875, -29.39892578125, -28.333984375, -27.26904296875, -26.2041015625, -25.13916015625, -24.07421875, -23.00927734375, -21.9443359375, -20.87939453125, -19.814453125, -18.74951171875, -17.6845703125, -16.61962890625, -15.5546875, -14.48974609375, -13.4248046875, -12.35986328125, -11.294921875, -10.22998046875, -9.1650390625, -8.10009765625, -7.03515625, -5.97021484375, -4.9052734375, -3.84033203125, -2.775390625, -1.71044921875, -0.6455078125, 0.41943359375, 1.484375, 2.54931640625, 3.6142578125, 4.67919921875, 5.744140625, 6.80908203125, 7.8740234375, 8.93896484375, 10.00390625, 11.06884765625, 12.1337890625, 13.19873046875, 14.263671875, 15.32861328125, 16.3935546875, 17.45849609375, 18.5234375, 19.58837890625, 20.6533203125, 21.71826171875, 22.783203125, 23.84814453125, 24.9130859375, 25.97802734375, 27.04296875, 28.10791015625, 29.1728515625, 30.23779296875, 31.302734375, 32.36767578125, 33.4326171875, 34.49755859375, 35.5625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 15.0, 19.0, 36.0, 44.0, 89.0, 98.0, 129.0, 133.0, 94.0, 114.0, 81.0, 66.0, 32.0, 28.0, 12.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.24629211425781, -92.76132202148438, -89.2763442993164, -85.79137420654297, -82.306396484375, -78.82142639160156, -75.33645629882812, -71.85148620605469, -68.36650848388672, -64.88153839111328, -61.39656066894531, -57.911590576171875, -54.42661666870117, -50.94164276123047, -47.45667266845703, -43.97169876098633, -40.486724853515625, -37.00175094604492, -33.51677703857422, -30.03180694580078, -26.546833038330078, -23.061859130859375, -19.576887130737305, -16.091915130615234, -12.606941223144531, -9.121968269348145, -5.636995315551758, -2.152022361755371, 1.3329505920410156, 4.817924499511719, 8.302896499633789, 11.78786849975586, 15.272834777832031, 18.757808685302734, 22.242780685424805, 25.727752685546875, 29.212726593017578, 32.69770050048828, 36.18267059326172, 39.66764450073242, 43.152618408203125, 46.63759231567383, 50.12256622314453, 53.60753631591797, 57.09251022338867, 60.577484130859375, 64.06245422363281, 67.54742431640625, 71.03240203857422, 74.51737213134766, 78.00234985351562, 81.48731994628906, 84.9722900390625, 88.45726776123047, 91.9422378540039, 95.42721557617188, 98.91218566894531, 102.39715576171875, 105.88213348388672, 109.36710357666016, 112.85208129882812, 116.33705139160156, 119.822021484375, 123.30699157714844, 126.7919692993164]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 4.0, 5.0, 18.0, 19.0, 23.0, 30.0, 10.0, 28.0, 28.0, 24.0, 37.0, 37.0, 51.0, 42.0, 41.0, 39.0, 51.0, 37.0, 44.0, 36.0, 34.0, 32.0, 45.0, 39.0, 32.0, 32.0, 21.0, 25.0, 20.0, 11.0, 23.0, 16.0, 16.0, 5.0, 10.0, 7.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.80789184570312, -63.88043212890625, -61.95297622680664, -60.02552032470703, -58.098060607910156, -56.17060089111328, -54.24314498901367, -52.31568908691406, -50.38822937011719, -48.46076965332031, -46.5333137512207, -44.605857849121094, -42.67839813232422, -40.750938415527344, -38.823482513427734, -36.896026611328125, -34.96856689453125, -33.041107177734375, -31.113651275634766, -29.186193466186523, -27.25873565673828, -25.33127784729004, -23.403820037841797, -21.476362228393555, -19.548904418945312, -17.62144660949707, -15.693988800048828, -13.766530990600586, -11.839073181152344, -9.911615371704102, -7.984157562255859, -6.056699752807617, -4.129241943359375, -2.201784133911133, -0.2743263244628906, 1.6531314849853516, 3.5805892944335938, 5.508047103881836, 7.435504913330078, 9.36296272277832, 11.290420532226562, 13.217878341674805, 15.145336151123047, 17.07279396057129, 19.00025177001953, 20.927709579467773, 22.855167388916016, 24.782625198364258, 26.7100830078125, 28.637540817260742, 30.564998626708984, 32.492454528808594, 34.41991424560547, 36.347373962402344, 38.27482986450195, 40.20228576660156, 42.12974548339844, 44.05720520019531, 45.98466110229492, 47.91211700439453, 49.839576721191406, 51.76703643798828, 53.69449234008789, 55.6219482421875, 57.549407958984375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 10.0, 7.0, 14.0, 15.0, 17.0, 10.0, 22.0, 28.0, 17.0, 31.0, 34.0, 37.0, 42.0, 32.0, 27.0, 53.0, 42.0, 42.0, 50.0, 42.0, 38.0, 33.0, 34.0, 32.0, 34.0, 23.0, 32.0, 27.0, 20.0, 22.0, 15.0, 19.0, 14.0, 13.0, 8.0, 7.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.296875, -7.06591796875, -6.8349609375, -6.60400390625, -6.373046875, -6.14208984375, -5.9111328125, -5.68017578125, -5.44921875, -5.21826171875, -4.9873046875, -4.75634765625, -4.525390625, -4.29443359375, -4.0634765625, -3.83251953125, -3.6015625, -3.37060546875, -3.1396484375, -2.90869140625, -2.677734375, -2.44677734375, -2.2158203125, -1.98486328125, -1.75390625, -1.52294921875, -1.2919921875, -1.06103515625, -0.830078125, -0.59912109375, -0.3681640625, -0.13720703125, 0.09375, 0.32470703125, 0.5556640625, 0.78662109375, 1.017578125, 1.24853515625, 1.4794921875, 1.71044921875, 1.94140625, 2.17236328125, 2.4033203125, 2.63427734375, 2.865234375, 3.09619140625, 3.3271484375, 3.55810546875, 3.7890625, 4.02001953125, 4.2509765625, 4.48193359375, 4.712890625, 4.94384765625, 5.1748046875, 5.40576171875, 5.63671875, 5.86767578125, 6.0986328125, 6.32958984375, 6.560546875, 6.79150390625, 7.0224609375, 7.25341796875, 7.484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 11.0, 11.0, 20.0, 18.0, 36.0, 68.0, 81.0, 127.0, 164.0, 261.0, 387.0, 575.0, 832.0, 1132.0, 1774.0, 2611.0, 4083.0, 6021.0, 9658.0, 14698.0, 23312.0, 36591.0, 57164.0, 88719.0, 131944.0, 169400.0, 160801.0, 117976.0, 79129.0, 50871.0, 31920.0, 20270.0, 13003.0, 8400.0, 5492.0, 3607.0, 2457.0, 1563.0, 1069.0, 736.0, 485.0, 335.0, 257.0, 148.0, 113.0, 80.0, 50.0, 33.0, 21.0, 16.0, 10.0, 4.0, 5.0, 5.0, 1.0, 3.0], "bins": [-0.578125, -0.5610504150390625, -0.543975830078125, -0.5269012451171875, -0.50982666015625, -0.4927520751953125, -0.475677490234375, -0.4586029052734375, -0.4415283203125, -0.4244537353515625, -0.407379150390625, -0.3903045654296875, -0.37322998046875, -0.3561553955078125, -0.339080810546875, -0.3220062255859375, -0.304931640625, -0.2878570556640625, -0.270782470703125, -0.2537078857421875, -0.23663330078125, -0.2195587158203125, -0.202484130859375, -0.1854095458984375, -0.1683349609375, -0.1512603759765625, -0.134185791015625, -0.1171112060546875, -0.10003662109375, -0.0829620361328125, -0.065887451171875, -0.0488128662109375, -0.03173828125, -0.0146636962890625, 0.002410888671875, 0.0194854736328125, 0.03656005859375, 0.0536346435546875, 0.070709228515625, 0.0877838134765625, 0.1048583984375, 0.1219329833984375, 0.139007568359375, 0.1560821533203125, 0.17315673828125, 0.1902313232421875, 0.207305908203125, 0.2243804931640625, 0.241455078125, 0.2585296630859375, 0.275604248046875, 0.2926788330078125, 0.30975341796875, 0.3268280029296875, 0.343902587890625, 0.3609771728515625, 0.3780517578125, 0.3951263427734375, 0.412200927734375, 0.4292755126953125, 0.44635009765625, 0.4634246826171875, 0.480499267578125, 0.4975738525390625, 0.5146484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 2.0, 8.0, 10.0, 9.0, 11.0, 11.0, 14.0, 13.0, 19.0, 18.0, 21.0, 26.0, 29.0, 33.0, 34.0, 36.0, 41.0, 39.0, 44.0, 39.0, 37.0, 1057.0, 34.0, 32.0, 32.0, 38.0, 40.0, 36.0, 32.0, 24.0, 24.0, 23.0, 14.0, 21.0, 19.0, 22.0, 16.0, 7.0, 15.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.875, -4.73162841796875, -4.5882568359375, -4.44488525390625, -4.301513671875, -4.15814208984375, -4.0147705078125, -3.87139892578125, -3.72802734375, -3.58465576171875, -3.4412841796875, -3.29791259765625, -3.154541015625, -3.01116943359375, -2.8677978515625, -2.72442626953125, -2.5810546875, -2.43768310546875, -2.2943115234375, -2.15093994140625, -2.007568359375, -1.86419677734375, -1.7208251953125, -1.57745361328125, -1.43408203125, -1.29071044921875, -1.1473388671875, -1.00396728515625, -0.860595703125, -0.71722412109375, -0.5738525390625, -0.43048095703125, -0.287109375, -0.14373779296875, -0.0003662109375, 0.14300537109375, 0.286376953125, 0.42974853515625, 0.5731201171875, 0.71649169921875, 0.85986328125, 1.00323486328125, 1.1466064453125, 1.28997802734375, 1.433349609375, 1.57672119140625, 1.7200927734375, 1.86346435546875, 2.0068359375, 2.15020751953125, 2.2935791015625, 2.43695068359375, 2.580322265625, 2.72369384765625, 2.8670654296875, 3.01043701171875, 3.15380859375, 3.29718017578125, 3.4405517578125, 3.58392333984375, 3.727294921875, 3.87066650390625, 4.0140380859375, 4.15740966796875, 4.30078125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 6.0, 3.0, 5.0, 7.0, 13.0, 13.0, 29.0, 31.0, 50.0, 94.0, 161.0, 216.0, 357.0, 558.0, 910.0, 1484.0, 2495.0, 4175.0, 6664.0, 11552.0, 19976.0, 33695.0, 57113.0, 93644.0, 140579.0, 1152440.0, 241378.0, 126725.0, 81843.0, 49338.0, 29297.0, 16928.0, 10016.0, 5929.0, 3668.0, 2161.0, 1350.0, 844.0, 521.0, 306.0, 186.0, 142.0, 80.0, 55.0, 29.0, 21.0, 24.0, 11.0, 7.0, 6.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4306640625, -0.41670989990234375, -0.4027557373046875, -0.38880157470703125, -0.374847412109375, -0.36089324951171875, -0.3469390869140625, -0.33298492431640625, -0.31903076171875, -0.30507659912109375, -0.2911224365234375, -0.27716827392578125, -0.263214111328125, -0.24925994873046875, -0.2353057861328125, -0.22135162353515625, -0.2073974609375, -0.19344329833984375, -0.1794891357421875, -0.16553497314453125, -0.151580810546875, -0.13762664794921875, -0.1236724853515625, -0.10971832275390625, -0.09576416015625, -0.08180999755859375, -0.0678558349609375, -0.05390167236328125, -0.039947509765625, -0.02599334716796875, -0.0120391845703125, 0.00191497802734375, 0.015869140625, 0.02982330322265625, 0.0437774658203125, 0.05773162841796875, 0.071685791015625, 0.08563995361328125, 0.0995941162109375, 0.11354827880859375, 0.12750244140625, 0.14145660400390625, 0.1554107666015625, 0.16936492919921875, 0.183319091796875, 0.19727325439453125, 0.2112274169921875, 0.22518157958984375, 0.2391357421875, 0.25308990478515625, 0.2670440673828125, 0.28099822998046875, 0.294952392578125, 0.30890655517578125, 0.3228607177734375, 0.33681488037109375, 0.35076904296875, 0.36472320556640625, 0.3786773681640625, 0.39263153076171875, 0.406585693359375, 0.42053985595703125, 0.4344940185546875, 0.44844818115234375, 0.46240234375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 10.0, 14.0, 16.0, 7.0, 11.0, 24.0, 34.0, 44.0, 47.0, 66.0, 92.0, 119.0, 107.0, 93.0, 75.0, 60.0, 35.0, 31.0, 26.0, 21.0, 13.0, 10.0, 2.0, 10.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01184844970703125, -0.011489391326904297, -0.011130332946777344, -0.01077127456665039, -0.010412216186523438, -0.010053157806396484, -0.009694099426269531, -0.009335041046142578, -0.008975982666015625, -0.008616924285888672, -0.008257865905761719, -0.007898807525634766, -0.0075397491455078125, -0.007180690765380859, -0.006821632385253906, -0.006462574005126953, -0.006103515625, -0.005744457244873047, -0.005385398864746094, -0.005026340484619141, -0.0046672821044921875, -0.004308223724365234, -0.003949165344238281, -0.003590106964111328, -0.003231048583984375, -0.002871990203857422, -0.0025129318237304688, -0.0021538734436035156, -0.0017948150634765625, -0.0014357566833496094, -0.0010766983032226562, -0.0007176399230957031, -0.00035858154296875, 4.76837158203125e-07, 0.00035953521728515625, 0.0007185935974121094, 0.0010776519775390625, 0.0014367103576660156, 0.0017957687377929688, 0.002154827117919922, 0.002513885498046875, 0.002872943878173828, 0.0032320022583007812, 0.0035910606384277344, 0.0039501190185546875, 0.004309177398681641, 0.004668235778808594, 0.005027294158935547, 0.0053863525390625, 0.005745410919189453, 0.006104469299316406, 0.006463527679443359, 0.0068225860595703125, 0.007181644439697266, 0.007540702819824219, 0.007899761199951172, 0.008258819580078125, 0.008617877960205078, 0.008976936340332031, 0.009335994720458984, 0.009695053100585938, 0.01005411148071289, 0.010413169860839844, 0.010772228240966797, 0.01113128662109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 8.0, 7.0, 10.0, 14.0, 16.0, 22.0, 42.0, 62.0, 79.0, 122.0, 209.0, 417.0, 2669.0, 806166.0, 236312.0, 1478.0, 365.0, 185.0, 100.0, 76.0, 48.0, 36.0, 21.0, 22.0, 13.0, 14.0, 7.0, 6.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2330322265625, -0.22635650634765625, -0.2196807861328125, -0.21300506591796875, -0.206329345703125, -0.19965362548828125, -0.1929779052734375, -0.18630218505859375, -0.17962646484375, -0.17295074462890625, -0.1662750244140625, -0.15959930419921875, -0.152923583984375, -0.14624786376953125, -0.1395721435546875, -0.13289642333984375, -0.126220703125, -0.11954498291015625, -0.1128692626953125, -0.10619354248046875, -0.099517822265625, -0.09284210205078125, -0.0861663818359375, -0.07949066162109375, -0.07281494140625, -0.06613922119140625, -0.0594635009765625, -0.05278778076171875, -0.046112060546875, -0.03943634033203125, -0.0327606201171875, -0.02608489990234375, -0.0194091796875, -0.01273345947265625, -0.0060577392578125, 0.00061798095703125, 0.007293701171875, 0.01396942138671875, 0.0206451416015625, 0.02732086181640625, 0.03399658203125, 0.04067230224609375, 0.0473480224609375, 0.05402374267578125, 0.060699462890625, 0.06737518310546875, 0.0740509033203125, 0.08072662353515625, 0.08740234375, 0.09407806396484375, 0.1007537841796875, 0.10742950439453125, 0.114105224609375, 0.12078094482421875, 0.1274566650390625, 0.13413238525390625, 0.14080810546875, 0.14748382568359375, 0.1541595458984375, 0.16083526611328125, 0.167510986328125, 0.17418670654296875, 0.1808624267578125, 0.18753814697265625, 0.1942138671875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 172.0, 683.0, 140.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08980203419923782, -0.0881827101111412, -0.08656337857246399, -0.08494405448436737, -0.08332473039627075, -0.08170539885759354, -0.08008607476949692, -0.0784667432308197, -0.07684741914272308, -0.07522809505462646, -0.07360876351594925, -0.07198943942785263, -0.07037010788917542, -0.0687507838010788, -0.06713145971298218, -0.06551212817430496, -0.06389280408620834, -0.062273476272821426, -0.06065414845943451, -0.05903482437133789, -0.057415496557950974, -0.055796168744564056, -0.05417684465646744, -0.05255751684308052, -0.050938189029693604, -0.049318861216306686, -0.04769953340291977, -0.04608020931482315, -0.044460881501436234, -0.042841553688049316, -0.0412222295999527, -0.03960290178656578, -0.037983573973178864, -0.036364246159791946, -0.03474491834640503, -0.03312559425830841, -0.031506266444921494, -0.029886938631534576, -0.02826761268079281, -0.02664828673005104, -0.025028957054018974, -0.023409631103277206, -0.02179030328989029, -0.020170975476503372, -0.018551649525761604, -0.016932323575019836, -0.01531299576163292, -0.013693668879568577, -0.012074341997504234, -0.010455015115439892, -0.00883568823337555, -0.007216361351311207, -0.005597034469246864, -0.003977707587182522, -0.0023583807051181793, -0.0007390538230538368, 0.0008802730590105057, 0.002499599941074848, 0.004118926823139191, 0.005738253705203533, 0.007357580587267876, 0.008976907469332218, 0.01059623435139656, 0.012215561233460903, 0.013834888115525246]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 6.0, 12.0, 10.0, 17.0, 18.0, 30.0, 23.0, 28.0, 32.0, 25.0, 32.0, 32.0, 44.0, 38.0, 41.0, 50.0, 43.0, 43.0, 35.0, 34.0, 46.0, 34.0, 32.0, 44.0, 33.0, 30.0, 36.0, 19.0, 17.0, 18.0, 14.0, 15.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.005070328712463379, -0.004917294718325138, -0.004764260724186897, -0.0046112267300486565, -0.004458192735910416, -0.004305158741772175, -0.004152124747633934, -0.003999090753495693, -0.0038460567593574524, -0.0036930227652192116, -0.0035399887710809708, -0.00338695477694273, -0.003233920782804489, -0.0030808867886662483, -0.0029278527945280075, -0.0027748188003897667, -0.002621784806251526, -0.002468750812113285, -0.0023157168179750443, -0.0021626828238368034, -0.0020096488296985626, -0.0018566148355603218, -0.001703580841422081, -0.0015505468472838402, -0.0013975128531455994, -0.0012444788590073586, -0.0010914448648691177, -0.0009384108707308769, -0.0007853768765926361, -0.0006323428824543953, -0.0004793088883161545, -0.00032627489417791367, -0.00017324090003967285, -2.0206905901432037e-05, 0.00013282708823680878, 0.0002858610823750496, 0.0004388950765132904, 0.0005919290706515312, 0.000744963064789772, 0.0008979970589280128, 0.0010510310530662537, 0.0012040650472044945, 0.0013570990413427353, 0.001510133035480976, 0.001663167029619217, 0.0018162010237574577, 0.0019692350178956985, 0.0021222690120339394, 0.00227530300617218, 0.002428337000310421, 0.002581370994448662, 0.0027344049885869026, 0.0028874389827251434, 0.0030404729768633842, 0.003193506971001625, 0.003346540965139866, 0.0034995749592781067, 0.0036526089534163475, 0.0038056429475545883, 0.003958676941692829, 0.00411171093583107, 0.004264744929969311, 0.004417778924107552, 0.004570812918245792, 0.004723846912384033]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 10.0, 7.0, 14.0, 15.0, 17.0, 10.0, 22.0, 28.0, 17.0, 31.0, 34.0, 37.0, 42.0, 32.0, 27.0, 53.0, 42.0, 42.0, 50.0, 42.0, 38.0, 33.0, 34.0, 32.0, 34.0, 23.0, 32.0, 27.0, 20.0, 22.0, 15.0, 19.0, 14.0, 13.0, 9.0, 6.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.296875, -7.06591796875, -6.8349609375, -6.60400390625, -6.373046875, -6.14208984375, -5.9111328125, -5.68017578125, -5.44921875, -5.21826171875, -4.9873046875, -4.75634765625, -4.525390625, -4.29443359375, -4.0634765625, -3.83251953125, -3.6015625, -3.37060546875, -3.1396484375, -2.90869140625, -2.677734375, -2.44677734375, -2.2158203125, -1.98486328125, -1.75390625, -1.52294921875, -1.2919921875, -1.06103515625, -0.830078125, -0.59912109375, -0.3681640625, -0.13720703125, 0.09375, 0.32470703125, 0.5556640625, 0.78662109375, 1.017578125, 1.24853515625, 1.4794921875, 1.71044921875, 1.94140625, 2.17236328125, 2.4033203125, 2.63427734375, 2.865234375, 3.09619140625, 3.3271484375, 3.55810546875, 3.7890625, 4.02001953125, 4.2509765625, 4.48193359375, 4.712890625, 4.94384765625, 5.1748046875, 5.40576171875, 5.63671875, 5.86767578125, 6.0986328125, 6.32958984375, 6.560546875, 6.79150390625, 7.0224609375, 7.25341796875, 7.484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 11.0, 11.0, 17.0, 16.0, 22.0, 49.0, 68.0, 90.0, 115.0, 199.0, 270.0, 407.0, 698.0, 997.0, 1558.0, 2465.0, 3840.0, 6382.0, 11881.0, 25796.0, 72131.0, 284989.0, 456657.0, 108332.0, 35648.0, 15370.0, 8069.0, 4412.0, 2816.0, 1802.0, 1159.0, 761.0, 505.0, 355.0, 235.0, 142.0, 90.0, 53.0, 36.0, 27.0, 25.0, 21.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.42578125, -7.1949462890625, -6.964111328125, -6.7332763671875, -6.50244140625, -6.2716064453125, -6.040771484375, -5.8099365234375, -5.5791015625, -5.3482666015625, -5.117431640625, -4.8865966796875, -4.65576171875, -4.4249267578125, -4.194091796875, -3.9632568359375, -3.732421875, -3.5015869140625, -3.270751953125, -3.0399169921875, -2.80908203125, -2.5782470703125, -2.347412109375, -2.1165771484375, -1.8857421875, -1.6549072265625, -1.424072265625, -1.1932373046875, -0.96240234375, -0.7315673828125, -0.500732421875, -0.2698974609375, -0.0390625, 0.1917724609375, 0.422607421875, 0.6534423828125, 0.88427734375, 1.1151123046875, 1.345947265625, 1.5767822265625, 1.8076171875, 2.0384521484375, 2.269287109375, 2.5001220703125, 2.73095703125, 2.9617919921875, 3.192626953125, 3.4234619140625, 3.654296875, 3.8851318359375, 4.115966796875, 4.3468017578125, 4.57763671875, 4.8084716796875, 5.039306640625, 5.2701416015625, 5.5009765625, 5.7318115234375, 5.962646484375, 6.1934814453125, 6.42431640625, 6.6551513671875, 6.885986328125, 7.1168212890625, 7.34765625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 5.0, 1.0, 5.0, 2.0, 5.0, 11.0, 11.0, 10.0, 15.0, 16.0, 14.0, 24.0, 29.0, 25.0, 27.0, 34.0, 42.0, 50.0, 50.0, 72.0, 89.0, 457.0, 1492.0, 122.0, 66.0, 63.0, 30.0, 38.0, 45.0, 34.0, 32.0, 16.0, 25.0, 18.0, 16.0, 16.0, 12.0, 6.0, 5.0, 7.0, 1.0, 4.0, 0.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.722900390625, -24.83642578125, -23.949951171875, -23.0634765625, -22.177001953125, -21.29052734375, -20.404052734375, -19.517578125, -18.631103515625, -17.74462890625, -16.858154296875, -15.9716796875, -15.085205078125, -14.19873046875, -13.312255859375, -12.42578125, -11.539306640625, -10.65283203125, -9.766357421875, -8.8798828125, -7.993408203125, -7.10693359375, -6.220458984375, -5.333984375, -4.447509765625, -3.56103515625, -2.674560546875, -1.7880859375, -0.901611328125, -0.01513671875, 0.871337890625, 1.7578125, 2.644287109375, 3.53076171875, 4.417236328125, 5.3037109375, 6.190185546875, 7.07666015625, 7.963134765625, 8.849609375, 9.736083984375, 10.62255859375, 11.509033203125, 12.3955078125, 13.281982421875, 14.16845703125, 15.054931640625, 15.94140625, 16.827880859375, 17.71435546875, 18.600830078125, 19.4873046875, 20.373779296875, 21.26025390625, 22.146728515625, 23.033203125, 23.919677734375, 24.80615234375, 25.692626953125, 26.5791015625, 27.465576171875, 28.35205078125, 29.238525390625, 30.125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 6.0, 6.0, 7.0, 5.0, 11.0, 17.0, 21.0, 33.0, 40.0, 46.0, 68.0, 95.0, 133.0, 273.0, 501.0, 1874.0, 20264.0, 3030971.0, 85883.0, 3770.0, 681.0, 360.0, 175.0, 119.0, 84.0, 60.0, 51.0, 26.0, 22.0, 21.0, 13.0, 17.0, 12.0, 6.0, 4.0, 4.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.5, -59.7265625, -57.953125, -56.1796875, -54.40625, -52.6328125, -50.859375, -49.0859375, -47.3125, -45.5390625, -43.765625, -41.9921875, -40.21875, -38.4453125, -36.671875, -34.8984375, -33.125, -31.3515625, -29.578125, -27.8046875, -26.03125, -24.2578125, -22.484375, -20.7109375, -18.9375, -17.1640625, -15.390625, -13.6171875, -11.84375, -10.0703125, -8.296875, -6.5234375, -4.75, -2.9765625, -1.203125, 0.5703125, 2.34375, 4.1171875, 5.890625, 7.6640625, 9.4375, 11.2109375, 12.984375, 14.7578125, 16.53125, 18.3046875, 20.078125, 21.8515625, 23.625, 25.3984375, 27.171875, 28.9453125, 30.71875, 32.4921875, 34.265625, 36.0390625, 37.8125, 39.5859375, 41.359375, 43.1328125, 44.90625, 46.6796875, 48.453125, 50.2265625, 52.0]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 22.0, 624.0, 361.0, 11.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.44829559326172, -67.84322357177734, -59.23815155029297, -50.63307571411133, -42.02800369262695, -33.42293167114258, -24.817855834960938, -16.212783813476562, -7.6077117919921875, 0.9973611831665039, 9.602434158325195, 18.207508087158203, 26.812580108642578, 35.41765213012695, 44.022727966308594, 52.62779998779297, 61.232872009277344, 69.83794403076172, 78.4430160522461, 87.048095703125, 95.65316772460938, 104.25823974609375, 112.86331176757812, 121.4683837890625, 130.07345581054688, 138.67852783203125, 147.28359985351562, 155.888671875, 164.49374389648438, 173.09881591796875, 181.70388793945312, 190.3089599609375, 198.91403198242188, 207.51910400390625, 216.12417602539062, 224.729248046875, 233.33432006835938, 241.93939208984375, 250.54446411132812, 259.1495361328125, 267.7546081542969, 276.35968017578125, 284.9647521972656, 293.56982421875, 302.1748962402344, 310.77996826171875, 319.3850402832031, 327.9901123046875, 336.59521484375, 345.2002868652344, 353.80535888671875, 362.4104309082031, 371.0155029296875, 379.6205749511719, 388.22564697265625, 396.8307189941406, 405.435791015625, 414.0408630371094, 422.64593505859375, 431.2510070800781, 439.8560791015625, 448.4611511230469, 457.06622314453125, 465.6712951660156, 474.2763671875]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 9.0, 8.0, 15.0, 17.0, 15.0, 24.0, 19.0, 23.0, 21.0, 34.0, 31.0, 39.0, 30.0, 37.0, 37.0, 40.0, 30.0, 41.0, 34.0, 43.0, 38.0, 30.0, 32.0, 34.0, 26.0, 34.0, 33.0, 30.0, 27.0, 22.0, 24.0, 15.0, 17.0, 8.0, 13.0, 12.0, 9.0, 7.0, 4.0, 2.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-74.39491271972656, -72.0333480834961, -69.6717758178711, -67.31021118164062, -64.94864654541016, -62.58707809448242, -60.22550964355469, -57.86394500732422, -55.502376556396484, -53.14080810546875, -50.77924346923828, -48.41767501831055, -46.05610656738281, -43.694541931152344, -41.33297348022461, -38.971405029296875, -36.609840393066406, -34.24827194213867, -31.886707305908203, -29.52513885498047, -27.163572311401367, -24.802005767822266, -22.44043731689453, -20.07887077331543, -17.717304229736328, -15.355737686157227, -12.994170188903809, -10.63260269165039, -8.271036148071289, -5.9094696044921875, -3.5479021072387695, -1.1863346099853516, 1.1752243041992188, 3.5367913246154785, 5.898358345031738, 8.259925842285156, 10.621492385864258, 12.98305892944336, 15.344626426696777, 17.706193923950195, 20.067760467529297, 22.4293270111084, 24.7908935546875, 27.152462005615234, 29.514028549194336, 31.875595092773438, 34.23716354370117, 36.598731994628906, 38.960296630859375, 41.32186508178711, 43.68342971801758, 46.04499816894531, 48.40656280517578, 50.768131256103516, 53.12969970703125, 55.49126434326172, 57.85283279418945, 60.21440124511719, 62.575965881347656, 64.93753051757812, 67.29910278320312, 69.6606674194336, 72.02223205566406, 74.38380432128906, 76.74536895751953]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 9.0, 7.0, 7.0, 9.0, 18.0, 13.0, 13.0, 10.0, 18.0, 29.0, 28.0, 38.0, 34.0, 31.0, 40.0, 37.0, 35.0, 36.0, 39.0, 50.0, 40.0, 40.0, 41.0, 44.0, 34.0, 30.0, 32.0, 31.0, 33.0, 22.0, 27.0, 18.0, 12.0, 10.0, 23.0, 11.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.60546875, -7.364013671875, -7.12255859375, -6.881103515625, -6.6396484375, -6.398193359375, -6.15673828125, -5.915283203125, -5.673828125, -5.432373046875, -5.19091796875, -4.949462890625, -4.7080078125, -4.466552734375, -4.22509765625, -3.983642578125, -3.7421875, -3.500732421875, -3.25927734375, -3.017822265625, -2.7763671875, -2.534912109375, -2.29345703125, -2.052001953125, -1.810546875, -1.569091796875, -1.32763671875, -1.086181640625, -0.8447265625, -0.603271484375, -0.36181640625, -0.120361328125, 0.12109375, 0.362548828125, 0.60400390625, 0.845458984375, 1.0869140625, 1.328369140625, 1.56982421875, 1.811279296875, 2.052734375, 2.294189453125, 2.53564453125, 2.777099609375, 3.0185546875, 3.260009765625, 3.50146484375, 3.742919921875, 3.984375, 4.225830078125, 4.46728515625, 4.708740234375, 4.9501953125, 5.191650390625, 5.43310546875, 5.674560546875, 5.916015625, 6.157470703125, 6.39892578125, 6.640380859375, 6.8818359375, 7.123291015625, 7.36474609375, 7.606201171875, 7.84765625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 10.0, 14.0, 21.0, 41.0, 47.0, 73.0, 130.0, 192.0, 298.0, 540.0, 1009.0, 1987.0, 3881.0, 8435.0, 18866.0, 44693.0, 119238.0, 368308.0, 1062786.0, 1474788.0, 721273.0, 230729.0, 79526.0, 31275.0, 13562.0, 6160.0, 2980.0, 1525.0, 787.0, 418.0, 262.0, 156.0, 85.0, 54.0, 39.0, 29.0, 17.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.75, -9.4481201171875, -9.146240234375, -8.8443603515625, -8.54248046875, -8.2406005859375, -7.938720703125, -7.6368408203125, -7.3349609375, -7.0330810546875, -6.731201171875, -6.4293212890625, -6.12744140625, -5.8255615234375, -5.523681640625, -5.2218017578125, -4.919921875, -4.6180419921875, -4.316162109375, -4.0142822265625, -3.71240234375, -3.4105224609375, -3.108642578125, -2.8067626953125, -2.5048828125, -2.2030029296875, -1.901123046875, -1.5992431640625, -1.29736328125, -0.9954833984375, -0.693603515625, -0.3917236328125, -0.08984375, 0.2120361328125, 0.513916015625, 0.8157958984375, 1.11767578125, 1.4195556640625, 1.721435546875, 2.0233154296875, 2.3251953125, 2.6270751953125, 2.928955078125, 3.2308349609375, 3.53271484375, 3.8345947265625, 4.136474609375, 4.4383544921875, 4.740234375, 5.0421142578125, 5.343994140625, 5.6458740234375, 5.94775390625, 6.2496337890625, 6.551513671875, 6.8533935546875, 7.1552734375, 7.4571533203125, 7.759033203125, 8.0609130859375, 8.36279296875, 8.6646728515625, 8.966552734375, 9.2684326171875, 9.5703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 12.0, 18.0, 16.0, 19.0, 39.0, 32.0, 48.0, 72.0, 96.0, 145.0, 185.0, 198.0, 272.0, 360.0, 423.0, 418.0, 403.0, 295.0, 234.0, 187.0, 140.0, 120.0, 81.0, 61.0, 56.0, 47.0, 21.0, 20.0, 14.0, 10.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.6875, -20.1314697265625, -19.575439453125, -19.0194091796875, -18.46337890625, -17.9073486328125, -17.351318359375, -16.7952880859375, -16.2392578125, -15.6832275390625, -15.127197265625, -14.5711669921875, -14.01513671875, -13.4591064453125, -12.903076171875, -12.3470458984375, -11.791015625, -11.2349853515625, -10.678955078125, -10.1229248046875, -9.56689453125, -9.0108642578125, -8.454833984375, -7.8988037109375, -7.3427734375, -6.7867431640625, -6.230712890625, -5.6746826171875, -5.11865234375, -4.5626220703125, -4.006591796875, -3.4505615234375, -2.89453125, -2.3385009765625, -1.782470703125, -1.2264404296875, -0.67041015625, -0.1143798828125, 0.441650390625, 0.9976806640625, 1.5537109375, 2.1097412109375, 2.665771484375, 3.2218017578125, 3.77783203125, 4.3338623046875, 4.889892578125, 5.4459228515625, 6.001953125, 6.5579833984375, 7.114013671875, 7.6700439453125, 8.22607421875, 8.7821044921875, 9.338134765625, 9.8941650390625, 10.4501953125, 11.0062255859375, 11.562255859375, 12.1182861328125, 12.67431640625, 13.2303466796875, 13.786376953125, 14.3424072265625, 14.8984375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 6.0, 3.0, 23.0, 27.0, 26.0, 30.0, 46.0, 76.0, 154.0, 256.0, 585.0, 1739.0, 6601.0, 33569.0, 237770.0, 2194158.0, 1529738.0, 158132.0, 23822.0, 4996.0, 1362.0, 476.0, 221.0, 123.0, 97.0, 64.0, 40.0, 31.0, 11.0, 24.0, 16.0, 12.0, 11.0, 3.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.11572265625, -30.0751953125, -29.03466796875, -27.994140625, -26.95361328125, -25.9130859375, -24.87255859375, -23.83203125, -22.79150390625, -21.7509765625, -20.71044921875, -19.669921875, -18.62939453125, -17.5888671875, -16.54833984375, -15.5078125, -14.46728515625, -13.4267578125, -12.38623046875, -11.345703125, -10.30517578125, -9.2646484375, -8.22412109375, -7.18359375, -6.14306640625, -5.1025390625, -4.06201171875, -3.021484375, -1.98095703125, -0.9404296875, 0.10009765625, 1.140625, 2.18115234375, 3.2216796875, 4.26220703125, 5.302734375, 6.34326171875, 7.3837890625, 8.42431640625, 9.46484375, 10.50537109375, 11.5458984375, 12.58642578125, 13.626953125, 14.66748046875, 15.7080078125, 16.74853515625, 17.7890625, 18.82958984375, 19.8701171875, 20.91064453125, 21.951171875, 22.99169921875, 24.0322265625, 25.07275390625, 26.11328125, 27.15380859375, 28.1943359375, 29.23486328125, 30.275390625, 31.31591796875, 32.3564453125, 33.39697265625, 34.4375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 14.0, 47.0, 85.0, 150.0, 213.0, 213.0, 110.0, 106.0, 43.0, 16.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.083740234375, -274.2662658691406, -268.4487609863281, -262.63128662109375, -256.8138122558594, -250.99632263183594, -245.1788330078125, -239.36135864257812, -233.54388427734375, -227.7263946533203, -221.90892028808594, -216.0914306640625, -210.27395629882812, -204.4564666748047, -198.63897705078125, -192.82150268554688, -187.00401306152344, -181.1865234375, -175.36904907226562, -169.5515594482422, -163.7340850830078, -157.91659545898438, -152.09912109375, -146.28163146972656, -140.46414184570312, -134.6466522216797, -128.8291778564453, -123.01168823242188, -117.1942138671875, -111.37672424316406, -105.55924224853516, -99.74176025390625, -93.92427825927734, -88.10679626464844, -82.28931427001953, -76.47183227539062, -70.65434265136719, -64.83686828613281, -59.019378662109375, -53.20189666748047, -47.38441467285156, -41.566932678222656, -35.74945068359375, -29.931964874267578, -24.114482879638672, -18.297000885009766, -12.479515075683594, -6.6620330810546875, -0.8445510864257812, 4.972931861877441, 10.790414810180664, 16.607898712158203, 22.42538070678711, 28.242862701416016, 34.06034851074219, 39.877830505371094, 45.6953125, 51.512794494628906, 57.33027648925781, 63.147762298583984, 68.96524047851562, 74.78273010253906, 80.60021209716797, 86.41769409179688, 92.23517608642578]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 9.0, 8.0, 7.0, 15.0, 27.0, 15.0, 21.0, 19.0, 15.0, 31.0, 28.0, 51.0, 42.0, 38.0, 45.0, 46.0, 38.0, 56.0, 52.0, 48.0, 34.0, 42.0, 40.0, 28.0, 39.0, 29.0, 35.0, 30.0, 21.0, 13.0, 18.0, 14.0, 12.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.48068237304688, -67.33245086669922, -65.18421936035156, -63.03598403930664, -60.887752532958984, -58.73952102661133, -56.591285705566406, -54.44305419921875, -52.294822692871094, -50.14659118652344, -47.99835968017578, -45.85012435913086, -43.7018928527832, -41.55366134643555, -39.405426025390625, -37.25719451904297, -35.10896301269531, -32.960731506347656, -30.812498092651367, -28.664264678955078, -26.516033172607422, -24.367801666259766, -22.219568252563477, -20.071334838867188, -17.92310333251953, -15.774870872497559, -13.626638412475586, -11.478405952453613, -9.33017349243164, -7.181941032409668, -5.033708572387695, -2.8854761123657227, -0.73724365234375, 1.4109888076782227, 3.5592212677001953, 5.707453727722168, 7.855686187744141, 10.003918647766113, 12.152151107788086, 14.300383567810059, 16.44861602783203, 18.596847534179688, 20.745080947875977, 22.893314361572266, 25.041545867919922, 27.189777374267578, 29.338010787963867, 31.486244201660156, 33.63447570800781, 35.78270721435547, 37.930938720703125, 40.07917404174805, 42.2274055480957, 44.37563705444336, 46.52387237548828, 48.67210388183594, 50.820335388183594, 52.96856689453125, 55.116798400878906, 57.26503372192383, 59.413265228271484, 61.56149673461914, 63.70973205566406, 65.85796356201172, 68.00619506835938]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 4.0, 5.0, 7.0, 9.0, 4.0, 7.0, 14.0, 18.0, 16.0, 14.0, 21.0, 20.0, 21.0, 33.0, 40.0, 31.0, 42.0, 36.0, 24.0, 52.0, 41.0, 54.0, 49.0, 40.0, 50.0, 38.0, 35.0, 27.0, 32.0, 35.0, 23.0, 25.0, 26.0, 19.0, 16.0, 12.0, 12.0, 12.0, 6.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.20367431640625, -6.9503173828125, -6.69696044921875, -6.443603515625, -6.19024658203125, -5.9368896484375, -5.68353271484375, -5.43017578125, -5.17681884765625, -4.9234619140625, -4.67010498046875, -4.416748046875, -4.16339111328125, -3.9100341796875, -3.65667724609375, -3.4033203125, -3.14996337890625, -2.8966064453125, -2.64324951171875, -2.389892578125, -2.13653564453125, -1.8831787109375, -1.62982177734375, -1.37646484375, -1.12310791015625, -0.8697509765625, -0.61639404296875, -0.363037109375, -0.10968017578125, 0.1436767578125, 0.39703369140625, 0.650390625, 0.90374755859375, 1.1571044921875, 1.41046142578125, 1.663818359375, 1.91717529296875, 2.1705322265625, 2.42388916015625, 2.67724609375, 2.93060302734375, 3.1839599609375, 3.43731689453125, 3.690673828125, 3.94403076171875, 4.1973876953125, 4.45074462890625, 4.7041015625, 4.95745849609375, 5.2108154296875, 5.46417236328125, 5.717529296875, 5.97088623046875, 6.2242431640625, 6.47760009765625, 6.73095703125, 6.98431396484375, 7.2376708984375, 7.49102783203125, 7.744384765625, 7.99774169921875, 8.2510986328125, 8.50445556640625, 8.7578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 16.0, 27.0, 34.0, 56.0, 117.0, 162.0, 168.0, 318.0, 461.0, 681.0, 951.0, 1363.0, 1931.0, 2802.0, 3969.0, 6015.0, 8614.0, 12597.0, 18359.0, 27498.0, 39687.0, 59133.0, 87003.0, 121040.0, 149339.0, 144519.0, 112661.0, 79449.0, 53941.0, 36977.0, 24941.0, 16879.0, 11403.0, 7803.0, 5382.0, 3870.0, 2587.0, 1793.0, 1290.0, 873.0, 576.0, 405.0, 296.0, 197.0, 154.0, 89.0, 53.0, 31.0, 23.0, 8.0, 8.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.5595703125, -0.5430564880371094, -0.5265426635742188, -0.5100288391113281, -0.4935150146484375, -0.4770011901855469, -0.46048736572265625, -0.4439735412597656, -0.427459716796875, -0.4109458923339844, -0.39443206787109375, -0.3779182434082031, -0.3614044189453125, -0.3448905944824219, -0.32837677001953125, -0.3118629455566406, -0.29534912109375, -0.2788352966308594, -0.26232147216796875, -0.24580764770507812, -0.2292938232421875, -0.21277999877929688, -0.19626617431640625, -0.17975234985351562, -0.163238525390625, -0.14672470092773438, -0.13021087646484375, -0.11369705200195312, -0.0971832275390625, -0.08066940307617188, -0.06415557861328125, -0.047641754150390625, -0.0311279296875, -0.014614105224609375, 0.00189971923828125, 0.018413543701171875, 0.0349273681640625, 0.051441192626953125, 0.06795501708984375, 0.08446884155273438, 0.100982666015625, 0.11749649047851562, 0.13401031494140625, 0.15052413940429688, 0.1670379638671875, 0.18355178833007812, 0.20006561279296875, 0.21657943725585938, 0.23309326171875, 0.24960708618164062, 0.26612091064453125, 0.2826347351074219, 0.2991485595703125, 0.3156623840332031, 0.33217620849609375, 0.3486900329589844, 0.365203857421875, 0.3817176818847656, 0.39823150634765625, 0.4147453308105469, 0.4312591552734375, 0.4477729797363281, 0.46428680419921875, 0.4808006286621094, 0.497314453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 3.0, 11.0, 3.0, 10.0, 15.0, 11.0, 13.0, 14.0, 16.0, 28.0, 25.0, 33.0, 33.0, 26.0, 40.0, 36.0, 36.0, 57.0, 55.0, 1070.0, 52.0, 50.0, 49.0, 40.0, 35.0, 31.0, 31.0, 23.0, 36.0, 29.0, 26.0, 17.0, 12.0, 14.0, 8.0, 7.0, 7.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-6.18359375, -6.01458740234375, -5.8455810546875, -5.67657470703125, -5.507568359375, -5.33856201171875, -5.1695556640625, -5.00054931640625, -4.83154296875, -4.66253662109375, -4.4935302734375, -4.32452392578125, -4.155517578125, -3.98651123046875, -3.8175048828125, -3.64849853515625, -3.4794921875, -3.31048583984375, -3.1414794921875, -2.97247314453125, -2.803466796875, -2.63446044921875, -2.4654541015625, -2.29644775390625, -2.12744140625, -1.95843505859375, -1.7894287109375, -1.62042236328125, -1.451416015625, -1.28240966796875, -1.1134033203125, -0.94439697265625, -0.775390625, -0.60638427734375, -0.4373779296875, -0.26837158203125, -0.099365234375, 0.06964111328125, 0.2386474609375, 0.40765380859375, 0.57666015625, 0.74566650390625, 0.9146728515625, 1.08367919921875, 1.252685546875, 1.42169189453125, 1.5906982421875, 1.75970458984375, 1.9287109375, 2.09771728515625, 2.2667236328125, 2.43572998046875, 2.604736328125, 2.77374267578125, 2.9427490234375, 3.11175537109375, 3.28076171875, 3.44976806640625, 3.6187744140625, 3.78778076171875, 3.956787109375, 4.12579345703125, 4.2947998046875, 4.46380615234375, 4.6328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 5.0, 18.0, 24.0, 45.0, 43.0, 77.0, 108.0, 129.0, 223.0, 315.0, 530.0, 784.0, 1207.0, 1827.0, 2910.0, 4670.0, 7056.0, 11765.0, 18736.0, 29377.0, 46086.0, 70792.0, 102791.0, 139155.0, 1192414.0, 148541.0, 107813.0, 74735.0, 49143.0, 31318.0, 19846.0, 12652.0, 7885.0, 5083.0, 3112.0, 2028.0, 1335.0, 847.0, 535.0, 374.0, 231.0, 160.0, 132.0, 95.0, 57.0, 40.0, 24.0, 12.0, 12.0, 7.0, 8.0, 6.0, 1.0, 0.0, 4.0, 3.0], "bins": [-0.408203125, -0.3956718444824219, -0.38314056396484375, -0.3706092834472656, -0.3580780029296875, -0.3455467224121094, -0.33301544189453125, -0.3204841613769531, -0.307952880859375, -0.2954216003417969, -0.28289031982421875, -0.2703590393066406, -0.2578277587890625, -0.24529647827148438, -0.23276519775390625, -0.22023391723632812, -0.20770263671875, -0.19517135620117188, -0.18264007568359375, -0.17010879516601562, -0.1575775146484375, -0.14504623413085938, -0.13251495361328125, -0.11998367309570312, -0.107452392578125, -0.09492111206054688, -0.08238983154296875, -0.06985855102539062, -0.0573272705078125, -0.044795989990234375, -0.03226470947265625, -0.019733428955078125, -0.0072021484375, 0.005329132080078125, 0.01786041259765625, 0.030391693115234375, 0.0429229736328125, 0.055454254150390625, 0.06798553466796875, 0.08051681518554688, 0.093048095703125, 0.10557937622070312, 0.11811065673828125, 0.13064193725585938, 0.1431732177734375, 0.15570449829101562, 0.16823577880859375, 0.18076705932617188, 0.19329833984375, 0.20582962036132812, 0.21836090087890625, 0.23089218139648438, 0.2434234619140625, 0.2559547424316406, 0.26848602294921875, 0.2810173034667969, 0.293548583984375, 0.3060798645019531, 0.31861114501953125, 0.3311424255371094, 0.3436737060546875, 0.3562049865722656, 0.36873626708984375, 0.3812675476074219, 0.393798828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 6.0, 5.0, 11.0, 14.0, 10.0, 15.0, 21.0, 26.0, 45.0, 31.0, 50.0, 64.0, 67.0, 91.0, 102.0, 83.0, 60.0, 51.0, 48.0, 36.0, 30.0, 25.0, 20.0, 12.0, 18.0, 9.0, 9.0, 7.0, 8.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00970458984375, -0.009337902069091797, -0.008971214294433594, -0.00860452651977539, -0.008237838745117188, -0.007871150970458984, -0.007504463195800781, -0.007137775421142578, -0.006771087646484375, -0.006404399871826172, -0.006037712097167969, -0.005671024322509766, -0.0053043365478515625, -0.004937648773193359, -0.004570960998535156, -0.004204273223876953, -0.00383758544921875, -0.003470897674560547, -0.0031042098999023438, -0.0027375221252441406, -0.0023708343505859375, -0.0020041465759277344, -0.0016374588012695312, -0.0012707710266113281, -0.000904083251953125, -0.0005373954772949219, -0.00017070770263671875, 0.00019598007202148438, 0.0005626678466796875, 0.0009293556213378906, 0.0012960433959960938, 0.0016627311706542969, 0.0020294189453125, 0.002396106719970703, 0.0027627944946289062, 0.0031294822692871094, 0.0034961700439453125, 0.0038628578186035156, 0.004229545593261719, 0.004596233367919922, 0.004962921142578125, 0.005329608917236328, 0.005696296691894531, 0.006062984466552734, 0.0064296722412109375, 0.006796360015869141, 0.007163047790527344, 0.007529735565185547, 0.00789642333984375, 0.008263111114501953, 0.008629798889160156, 0.00899648666381836, 0.009363174438476562, 0.009729862213134766, 0.010096549987792969, 0.010463237762451172, 0.010829925537109375, 0.011196613311767578, 0.011563301086425781, 0.011929988861083984, 0.012296676635742188, 0.01266336441040039, 0.013030052185058594, 0.013396739959716797, 0.013763427734375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 4.0, 8.0, 10.0, 13.0, 16.0, 32.0, 45.0, 61.0, 88.0, 133.0, 234.0, 455.0, 2167.0, 571993.0, 470128.0, 2070.0, 430.0, 235.0, 133.0, 87.0, 69.0, 33.0, 25.0, 20.0, 16.0, 8.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2432861328125, -0.2361278533935547, -0.22896957397460938, -0.22181129455566406, -0.21465301513671875, -0.20749473571777344, -0.20033645629882812, -0.1931781768798828, -0.1860198974609375, -0.1788616180419922, -0.17170333862304688, -0.16454505920410156, -0.15738677978515625, -0.15022850036621094, -0.14307022094726562, -0.1359119415283203, -0.128753662109375, -0.12159538269042969, -0.11443710327148438, -0.10727882385253906, -0.10012054443359375, -0.09296226501464844, -0.08580398559570312, -0.07864570617675781, -0.0714874267578125, -0.06432914733886719, -0.057170867919921875, -0.05001258850097656, -0.04285430908203125, -0.03569602966308594, -0.028537750244140625, -0.021379470825195312, -0.01422119140625, -0.0070629119873046875, 9.5367431640625e-05, 0.0072536468505859375, 0.01441192626953125, 0.021570205688476562, 0.028728485107421875, 0.03588676452636719, 0.0430450439453125, 0.05020332336425781, 0.057361602783203125, 0.06451988220214844, 0.07167816162109375, 0.07883644104003906, 0.08599472045898438, 0.09315299987792969, 0.100311279296875, 0.10746955871582031, 0.11462783813476562, 0.12178611755371094, 0.12894439697265625, 0.13610267639160156, 0.14326095581054688, 0.1504192352294922, 0.1575775146484375, 0.1647357940673828, 0.17189407348632812, 0.17905235290527344, 0.18621063232421875, 0.19336891174316406, 0.20052719116210938, 0.2076854705810547, 0.21484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 40.0, 348.0, 496.0, 118.0, 12.0, 0.0, 1.0, 1.0], "bins": [-0.07492337375879288, -0.07363671809434891, -0.07235006242990494, -0.07106341421604156, -0.0697767585515976, -0.06849010288715363, -0.06720344722270966, -0.06591679155826569, -0.06463013589382172, -0.06334348022937775, -0.062056828290224075, -0.060770172625780106, -0.059483520686626434, -0.058196865022182465, -0.056910209357738495, -0.055623553693294525, -0.05433690547943115, -0.05305024981498718, -0.05176359787583351, -0.05047694221138954, -0.04919029027223587, -0.0479036346077919, -0.04661697894334793, -0.04533032327890396, -0.04404367133975029, -0.04275701567530632, -0.04147036373615265, -0.04018370807170868, -0.03889705240726471, -0.03761040046811104, -0.03632374480366707, -0.0350370928645134, -0.03375043720006943, -0.03246378153562546, -0.031177129596471786, -0.029890473932027817, -0.028603820130228996, -0.027317166328430176, -0.026030510663986206, -0.024743856862187386, -0.023457204923033714, -0.022170551121234894, -0.020883895456790924, -0.019597241654992104, -0.018310587853193283, -0.017023934051394463, -0.015737280249595642, -0.014450624585151672, -0.013163970783352852, -0.011877316981554031, -0.010590662248432636, -0.009304007515311241, -0.00801735371351242, -0.006730699446052313, -0.005444045178592205, -0.00415739044547081, -0.002870736178010702, -0.0015840819105505943, -0.0002974276430904865, 0.0009892266243696213, 0.002275880891829729, 0.003562535159289837, 0.004849189426749945, 0.00613584415987134, 0.00742249796167016]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 13.0, 9.0, 21.0, 16.0, 24.0, 17.0, 21.0, 21.0, 30.0, 36.0, 34.0, 30.0, 39.0, 45.0, 37.0, 40.0, 42.0, 37.0, 40.0, 33.0, 34.0, 44.0, 38.0, 24.0, 28.0, 32.0, 16.0, 25.0, 33.0, 17.0, 18.0, 18.0, 15.0, 8.0, 8.0, 5.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005651652812957764, -0.005479979328811169, -0.005308305844664574, -0.005136632360517979, -0.004964958876371384, -0.004793285392224789, -0.004621611908078194, -0.004449938423931599, -0.004278264939785004, -0.004106591455638409, -0.003934917971491814, -0.0037632444873452187, -0.0035915710031986237, -0.0034198975190520287, -0.0032482240349054337, -0.0030765505507588387, -0.0029048770666122437, -0.0027332035824656487, -0.0025615300983190536, -0.0023898566141724586, -0.0022181831300258636, -0.0020465096458792686, -0.0018748361617326736, -0.0017031626775860786, -0.0015314891934394836, -0.0013598157092928886, -0.0011881422251462936, -0.0010164687409996986, -0.0008447952568531036, -0.0006731217727065086, -0.0005014482885599136, -0.00032977480441331863, -0.00015810132026672363, 1.3572163879871368e-05, 0.00018524564802646637, 0.00035691913217306137, 0.0005285926163196564, 0.0007002661004662514, 0.0008719395846128464, 0.0010436130687594414, 0.0012152865529060364, 0.0013869600370526314, 0.0015586335211992264, 0.0017303070053458214, 0.0019019804894924164, 0.0020736539736390114, 0.0022453274577856064, 0.0024170009419322014, 0.0025886744260787964, 0.0027603479102253914, 0.0029320213943719864, 0.0031036948785185814, 0.0032753683626651764, 0.0034470418468117714, 0.0036187153309583664, 0.0037903888151049614, 0.003962062299251556, 0.004133735783398151, 0.004305409267544746, 0.004477082751691341, 0.004648756235837936, 0.004820429719984531, 0.004992103204131126, 0.005163776688277721, 0.005335450172424316]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 4.0, 5.0, 7.0, 9.0, 4.0, 7.0, 14.0, 18.0, 16.0, 14.0, 21.0, 20.0, 21.0, 33.0, 40.0, 31.0, 42.0, 36.0, 24.0, 52.0, 41.0, 54.0, 49.0, 40.0, 50.0, 38.0, 35.0, 27.0, 32.0, 35.0, 23.0, 25.0, 26.0, 19.0, 15.0, 12.0, 13.0, 12.0, 6.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.45703125, -7.20367431640625, -6.9503173828125, -6.69696044921875, -6.443603515625, -6.19024658203125, -5.9368896484375, -5.68353271484375, -5.43017578125, -5.17681884765625, -4.9234619140625, -4.67010498046875, -4.416748046875, -4.16339111328125, -3.9100341796875, -3.65667724609375, -3.4033203125, -3.14996337890625, -2.8966064453125, -2.64324951171875, -2.389892578125, -2.13653564453125, -1.8831787109375, -1.62982177734375, -1.37646484375, -1.12310791015625, -0.8697509765625, -0.61639404296875, -0.363037109375, -0.10968017578125, 0.1436767578125, 0.39703369140625, 0.650390625, 0.90374755859375, 1.1571044921875, 1.41046142578125, 1.663818359375, 1.91717529296875, 2.1705322265625, 2.42388916015625, 2.67724609375, 2.93060302734375, 3.1839599609375, 3.43731689453125, 3.690673828125, 3.94403076171875, 4.1973876953125, 4.45074462890625, 4.7041015625, 4.95745849609375, 5.2108154296875, 5.46417236328125, 5.717529296875, 5.97088623046875, 6.2242431640625, 6.47760009765625, 6.73095703125, 6.98431396484375, 7.2376708984375, 7.49102783203125, 7.744384765625, 7.99774169921875, 8.2510986328125, 8.50445556640625, 8.7578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 6.0, 15.0, 14.0, 36.0, 39.0, 64.0, 79.0, 119.0, 162.0, 282.0, 404.0, 605.0, 1041.0, 1752.0, 2979.0, 5210.0, 9540.0, 18707.0, 41847.0, 113584.0, 365379.0, 314563.0, 97533.0, 36833.0, 16955.0, 8614.0, 4912.0, 2829.0, 1676.0, 1013.0, 613.0, 370.0, 232.0, 181.0, 111.0, 70.0, 52.0, 38.0, 25.0, 23.0, 12.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.73828125, -5.54656982421875, -5.3548583984375, -5.16314697265625, -4.971435546875, -4.77972412109375, -4.5880126953125, -4.39630126953125, -4.20458984375, -4.01287841796875, -3.8211669921875, -3.62945556640625, -3.437744140625, -3.24603271484375, -3.0543212890625, -2.86260986328125, -2.6708984375, -2.47918701171875, -2.2874755859375, -2.09576416015625, -1.904052734375, -1.71234130859375, -1.5206298828125, -1.32891845703125, -1.13720703125, -0.94549560546875, -0.7537841796875, -0.56207275390625, -0.370361328125, -0.17864990234375, 0.0130615234375, 0.20477294921875, 0.396484375, 0.58819580078125, 0.7799072265625, 0.97161865234375, 1.163330078125, 1.35504150390625, 1.5467529296875, 1.73846435546875, 1.93017578125, 2.12188720703125, 2.3135986328125, 2.50531005859375, 2.697021484375, 2.88873291015625, 3.0804443359375, 3.27215576171875, 3.4638671875, 3.65557861328125, 3.8472900390625, 4.03900146484375, 4.230712890625, 4.42242431640625, 4.6141357421875, 4.80584716796875, 4.99755859375, 5.18927001953125, 5.3809814453125, 5.57269287109375, 5.764404296875, 5.95611572265625, 6.1478271484375, 6.33953857421875, 6.53125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 5.0, 14.0, 13.0, 16.0, 9.0, 17.0, 21.0, 26.0, 33.0, 42.0, 41.0, 45.0, 64.0, 76.0, 293.0, 1702.0, 166.0, 76.0, 77.0, 56.0, 42.0, 32.0, 31.0, 26.0, 23.0, 24.0, 14.0, 13.0, 12.0, 5.0, 12.0, 5.0, 0.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.46337890625, -37.2705078125, -36.07763671875, -34.884765625, -33.69189453125, -32.4990234375, -31.30615234375, -30.11328125, -28.92041015625, -27.7275390625, -26.53466796875, -25.341796875, -24.14892578125, -22.9560546875, -21.76318359375, -20.5703125, -19.37744140625, -18.1845703125, -16.99169921875, -15.798828125, -14.60595703125, -13.4130859375, -12.22021484375, -11.02734375, -9.83447265625, -8.6416015625, -7.44873046875, -6.255859375, -5.06298828125, -3.8701171875, -2.67724609375, -1.484375, -0.29150390625, 0.9013671875, 2.09423828125, 3.287109375, 4.47998046875, 5.6728515625, 6.86572265625, 8.05859375, 9.25146484375, 10.4443359375, 11.63720703125, 12.830078125, 14.02294921875, 15.2158203125, 16.40869140625, 17.6015625, 18.79443359375, 19.9873046875, 21.18017578125, 22.373046875, 23.56591796875, 24.7587890625, 25.95166015625, 27.14453125, 28.33740234375, 29.5302734375, 30.72314453125, 31.916015625, 33.10888671875, 34.3017578125, 35.49462890625, 36.6875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 14.0, 17.0, 25.0, 30.0, 34.0, 62.0, 49.0, 100.0, 153.0, 225.0, 434.0, 1170.0, 26037.0, 3102686.0, 12690.0, 951.0, 353.0, 186.0, 112.0, 96.0, 63.0, 47.0, 39.0, 24.0, 14.0, 16.0, 11.0, 17.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.375, -70.9638671875, -68.552734375, -66.1416015625, -63.73046875, -61.3193359375, -58.908203125, -56.4970703125, -54.0859375, -51.6748046875, -49.263671875, -46.8525390625, -44.44140625, -42.0302734375, -39.619140625, -37.2080078125, -34.796875, -32.3857421875, -29.974609375, -27.5634765625, -25.15234375, -22.7412109375, -20.330078125, -17.9189453125, -15.5078125, -13.0966796875, -10.685546875, -8.2744140625, -5.86328125, -3.4521484375, -1.041015625, 1.3701171875, 3.78125, 6.1923828125, 8.603515625, 11.0146484375, 13.42578125, 15.8369140625, 18.248046875, 20.6591796875, 23.0703125, 25.4814453125, 27.892578125, 30.3037109375, 32.71484375, 35.1259765625, 37.537109375, 39.9482421875, 42.359375, 44.7705078125, 47.181640625, 49.5927734375, 52.00390625, 54.4150390625, 56.826171875, 59.2373046875, 61.6484375, 64.0595703125, 66.470703125, 68.8818359375, 71.29296875, 73.7041015625, 76.115234375, 78.5263671875, 80.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 49.0, 123.0, 230.0, 270.0, 195.0, 96.0, 25.0, 14.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.53850555419922, -75.20618438720703, -72.87386322021484, -70.54153442382812, -68.20921325683594, -65.87689208984375, -63.54457092285156, -61.212249755859375, -58.87992477416992, -56.547603607177734, -54.21527862548828, -51.882957458496094, -49.550636291503906, -47.21831130981445, -44.885990142822266, -42.55366516113281, -40.221343994140625, -37.88902282714844, -35.556697845458984, -33.2243766784668, -30.892053604125977, -28.559730529785156, -26.22740936279297, -23.89508628845215, -21.562763214111328, -19.230440139770508, -16.898117065429688, -14.5657958984375, -12.23347282409668, -9.90114974975586, -7.5688276290893555, -5.236505508422852, -2.9041824340820312, -0.5718598365783691, 1.760462760925293, 4.092785358428955, 6.425107955932617, 8.757431030273438, 11.089753150939941, 13.422075271606445, 15.754398345947266, 18.086721420288086, 20.419044494628906, 22.751365661621094, 25.083688735961914, 27.416011810302734, 29.748332977294922, 32.080657958984375, 34.41297912597656, 36.74530029296875, 39.0776252746582, 41.40994644165039, 43.742271423339844, 46.07459259033203, 48.40691375732422, 50.739234924316406, 53.07155990600586, 55.40388107299805, 57.7362060546875, 60.06852722167969, 62.400848388671875, 64.73316955566406, 67.06549835205078, 69.39781951904297, 71.73014068603516]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 9.0, 9.0, 4.0, 10.0, 12.0, 13.0, 16.0, 9.0, 18.0, 19.0, 26.0, 29.0, 34.0, 39.0, 38.0, 49.0, 35.0, 50.0, 38.0, 54.0, 44.0, 44.0, 55.0, 26.0, 42.0, 39.0, 30.0, 38.0, 29.0, 16.0, 24.0, 21.0, 22.0, 13.0, 9.0, 6.0, 11.0, 6.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-86.75184631347656, -84.26504516601562, -81.77825164794922, -79.29145050048828, -76.80464935302734, -74.31785583496094, -71.8310546875, -69.34425354003906, -66.85745239257812, -64.37065124511719, -61.883853912353516, -59.397056579589844, -56.910255432128906, -54.423458099365234, -51.93666076660156, -49.449859619140625, -46.96306610107422, -44.47626876831055, -41.98946762084961, -39.50267028808594, -37.015869140625, -34.52907180786133, -32.042274475097656, -29.55547523498535, -27.068675994873047, -24.581876754760742, -22.095077514648438, -19.608280181884766, -17.12148094177246, -14.634681701660156, -12.147883415222168, -9.66108512878418, -7.174293518066406, -4.68749475479126, -2.2006959915161133, 0.2861027717590332, 2.7729015350341797, 5.259700775146484, 7.746499061584473, 10.233297348022461, 12.720096588134766, 15.20689582824707, 17.693695068359375, 20.180492401123047, 22.66729164123535, 25.154090881347656, 27.640888214111328, 30.127687454223633, 32.61448669433594, 35.10128402709961, 37.58808517456055, 40.07488250732422, 42.561683654785156, 45.04848098754883, 47.5352783203125, 50.02207946777344, 52.50887680053711, 54.99567413330078, 57.48247528076172, 59.96927261352539, 62.45606994628906, 64.94287109375, 67.42967224121094, 69.91646575927734, 72.40326690673828]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 8.0, 3.0, 7.0, 7.0, 8.0, 7.0, 7.0, 14.0, 15.0, 14.0, 28.0, 20.0, 14.0, 35.0, 35.0, 37.0, 34.0, 42.0, 43.0, 39.0, 34.0, 47.0, 51.0, 46.0, 49.0, 38.0, 44.0, 29.0, 40.0, 27.0, 27.0, 19.0, 26.0, 18.0, 23.0, 10.0, 10.0, 12.0, 13.0, 5.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.92822265625, -7.6611328125, -7.39404296875, -7.126953125, -6.85986328125, -6.5927734375, -6.32568359375, -6.05859375, -5.79150390625, -5.5244140625, -5.25732421875, -4.990234375, -4.72314453125, -4.4560546875, -4.18896484375, -3.921875, -3.65478515625, -3.3876953125, -3.12060546875, -2.853515625, -2.58642578125, -2.3193359375, -2.05224609375, -1.78515625, -1.51806640625, -1.2509765625, -0.98388671875, -0.716796875, -0.44970703125, -0.1826171875, 0.08447265625, 0.3515625, 0.61865234375, 0.8857421875, 1.15283203125, 1.419921875, 1.68701171875, 1.9541015625, 2.22119140625, 2.48828125, 2.75537109375, 3.0224609375, 3.28955078125, 3.556640625, 3.82373046875, 4.0908203125, 4.35791015625, 4.625, 4.89208984375, 5.1591796875, 5.42626953125, 5.693359375, 5.96044921875, 6.2275390625, 6.49462890625, 6.76171875, 7.02880859375, 7.2958984375, 7.56298828125, 7.830078125, 8.09716796875, 8.3642578125, 8.63134765625, 8.8984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 10.0, 9.0, 12.0, 15.0, 16.0, 10.0, 25.0, 28.0, 26.0, 34.0, 53.0, 88.0, 144.0, 267.0, 750.0, 3278.0, 33066.0, 942068.0, 3063033.0, 139806.0, 9218.0, 1261.0, 410.0, 170.0, 121.0, 70.0, 60.0, 31.0, 29.0, 31.0, 19.0, 16.0, 12.0, 17.0, 15.0, 9.0, 3.0, 2.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.5625, -32.521484375, -31.48046875, -30.439453125, -29.3984375, -28.357421875, -27.31640625, -26.275390625, -25.234375, -24.193359375, -23.15234375, -22.111328125, -21.0703125, -20.029296875, -18.98828125, -17.947265625, -16.90625, -15.865234375, -14.82421875, -13.783203125, -12.7421875, -11.701171875, -10.66015625, -9.619140625, -8.578125, -7.537109375, -6.49609375, -5.455078125, -4.4140625, -3.373046875, -2.33203125, -1.291015625, -0.25, 0.791015625, 1.83203125, 2.873046875, 3.9140625, 4.955078125, 5.99609375, 7.037109375, 8.078125, 9.119140625, 10.16015625, 11.201171875, 12.2421875, 13.283203125, 14.32421875, 15.365234375, 16.40625, 17.447265625, 18.48828125, 19.529296875, 20.5703125, 21.611328125, 22.65234375, 23.693359375, 24.734375, 25.775390625, 26.81640625, 27.857421875, 28.8984375, 29.939453125, 30.98046875, 32.021484375, 33.0625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 15.0, 15.0, 21.0, 31.0, 74.0, 90.0, 154.0, 216.0, 290.0, 446.0, 569.0, 575.0, 498.0, 342.0, 235.0, 183.0, 105.0, 72.0, 51.0, 27.0, 20.0, 13.0, 13.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.78125, -29.001708984375, -28.22216796875, -27.442626953125, -26.6630859375, -25.883544921875, -25.10400390625, -24.324462890625, -23.544921875, -22.765380859375, -21.98583984375, -21.206298828125, -20.4267578125, -19.647216796875, -18.86767578125, -18.088134765625, -17.30859375, -16.529052734375, -15.74951171875, -14.969970703125, -14.1904296875, -13.410888671875, -12.63134765625, -11.851806640625, -11.072265625, -10.292724609375, -9.51318359375, -8.733642578125, -7.9541015625, -7.174560546875, -6.39501953125, -5.615478515625, -4.8359375, -4.056396484375, -3.27685546875, -2.497314453125, -1.7177734375, -0.938232421875, -0.15869140625, 0.620849609375, 1.400390625, 2.179931640625, 2.95947265625, 3.739013671875, 4.5185546875, 5.298095703125, 6.07763671875, 6.857177734375, 7.63671875, 8.416259765625, 9.19580078125, 9.975341796875, 10.7548828125, 11.534423828125, 12.31396484375, 13.093505859375, 13.873046875, 14.652587890625, 15.43212890625, 16.211669921875, 16.9912109375, 17.770751953125, 18.55029296875, 19.329833984375, 20.109375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 2.0, 15.0, 15.0, 26.0, 44.0, 60.0, 96.0, 158.0, 307.0, 659.0, 1880.0, 16639.0, 769678.0, 3325593.0, 73264.0, 3899.0, 925.0, 433.0, 243.0, 134.0, 72.0, 49.0, 27.0, 13.0, 14.0, 9.0, 9.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.6875, -44.6767578125, -42.666015625, -40.6552734375, -38.64453125, -36.6337890625, -34.623046875, -32.6123046875, -30.6015625, -28.5908203125, -26.580078125, -24.5693359375, -22.55859375, -20.5478515625, -18.537109375, -16.5263671875, -14.515625, -12.5048828125, -10.494140625, -8.4833984375, -6.47265625, -4.4619140625, -2.451171875, -0.4404296875, 1.5703125, 3.5810546875, 5.591796875, 7.6025390625, 9.61328125, 11.6240234375, 13.634765625, 15.6455078125, 17.65625, 19.6669921875, 21.677734375, 23.6884765625, 25.69921875, 27.7099609375, 29.720703125, 31.7314453125, 33.7421875, 35.7529296875, 37.763671875, 39.7744140625, 41.78515625, 43.7958984375, 45.806640625, 47.8173828125, 49.828125, 51.8388671875, 53.849609375, 55.8603515625, 57.87109375, 59.8818359375, 61.892578125, 63.9033203125, 65.9140625, 67.9248046875, 69.935546875, 71.9462890625, 73.95703125, 75.9677734375, 77.978515625, 79.9892578125, 82.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 7.0, 34.0, 82.0, 114.0, 178.0, 204.0, 172.0, 118.0, 50.0, 34.0, 11.0, 2.0, 2.0], "bins": [-317.98980712890625, -312.3635559082031, -306.7373352050781, -301.111083984375, -295.4848327636719, -289.85858154296875, -284.23236083984375, -278.6061096191406, -272.9798583984375, -267.3536071777344, -261.7273864746094, -256.10113525390625, -250.47488403320312, -244.84864807128906, -239.222412109375, -233.59616088867188, -227.96994018554688, -222.3437042236328, -216.7174530029297, -211.09121704101562, -205.4649658203125, -199.83872985839844, -194.21249389648438, -188.58624267578125, -182.95999145507812, -177.33375549316406, -171.70750427246094, -166.08126831054688, -160.45501708984375, -154.8287811279297, -149.20254516601562, -143.5762939453125, -137.95005798339844, -132.32382202148438, -126.69757080078125, -121.07133483886719, -115.4450912475586, -109.81884765625, -104.1926040649414, -98.56636047363281, -92.94012451171875, -87.31388092041016, -81.68763732910156, -76.0614013671875, -70.4351577758789, -64.80891418457031, -59.18267059326172, -53.55643081665039, -47.9301872253418, -42.3039436340332, -36.677703857421875, -31.05146026611328, -25.42521858215332, -19.79897689819336, -14.172733306884766, -8.546493530273438, -2.9202499389648438, 2.7059922218322754, 8.332234382629395, 13.958477020263672, 19.584718704223633, 25.210960388183594, 30.837203979492188, 36.463443756103516, 42.08968734741211]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 9.0, 6.0, 6.0, 8.0, 16.0, 18.0, 28.0, 37.0, 34.0, 22.0, 39.0, 34.0, 32.0, 32.0, 32.0, 43.0, 32.0, 50.0, 37.0, 51.0, 40.0, 41.0, 32.0, 42.0, 38.0, 33.0, 29.0, 23.0, 19.0, 19.0, 22.0, 16.0, 11.0, 13.0, 9.0, 9.0, 4.0, 8.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-70.81964111328125, -68.85372924804688, -66.88780975341797, -64.9218978881836, -62.95598602294922, -60.99007034301758, -59.02415466308594, -57.05824279785156, -55.09232711791992, -53.12641143798828, -51.160499572753906, -49.194583892822266, -47.228668212890625, -45.26275634765625, -43.29684066772461, -41.33092498779297, -39.365013122558594, -37.39909744262695, -35.43318557739258, -33.46726989746094, -31.50135612487793, -29.535442352294922, -27.56952667236328, -25.603612899780273, -23.637699127197266, -21.671785354614258, -19.70587158203125, -17.73995590209961, -15.774042129516602, -13.808128356933594, -11.84221363067627, -9.876298904418945, -7.9103851318359375, -5.9444708824157715, -3.9785566329956055, -2.0126423835754395, -0.04672813415527344, 1.9191856384277344, 3.8851003646850586, 5.851015090942383, 7.816928863525391, 9.782842636108398, 11.748757362365723, 13.714672088623047, 15.680585861206055, 17.646499633789062, 19.612415313720703, 21.57832908630371, 23.54424285888672, 25.510156631469727, 27.476070404052734, 29.441986083984375, 31.407899856567383, 33.37381362915039, 35.33972930908203, 37.305641174316406, 39.27155685424805, 41.23747253417969, 43.20338439941406, 45.1693000793457, 47.135215759277344, 49.10112762451172, 51.06704330444336, 53.032958984375, 54.998870849609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 4.0, 8.0, 5.0, 7.0, 10.0, 14.0, 12.0, 14.0, 19.0, 16.0, 16.0, 38.0, 34.0, 29.0, 33.0, 35.0, 44.0, 47.0, 47.0, 47.0, 55.0, 42.0, 42.0, 56.0, 30.0, 41.0, 45.0, 30.0, 21.0, 24.0, 33.0, 15.0, 12.0, 9.0, 15.0, 14.0, 3.0, 8.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.3819580078125, -7.099853515625, -6.8177490234375, -6.53564453125, -6.2535400390625, -5.971435546875, -5.6893310546875, -5.4072265625, -5.1251220703125, -4.843017578125, -4.5609130859375, -4.27880859375, -3.9967041015625, -3.714599609375, -3.4324951171875, -3.150390625, -2.8682861328125, -2.586181640625, -2.3040771484375, -2.02197265625, -1.7398681640625, -1.457763671875, -1.1756591796875, -0.8935546875, -0.6114501953125, -0.329345703125, -0.0472412109375, 0.23486328125, 0.5169677734375, 0.799072265625, 1.0811767578125, 1.36328125, 1.6453857421875, 1.927490234375, 2.2095947265625, 2.49169921875, 2.7738037109375, 3.055908203125, 3.3380126953125, 3.6201171875, 3.9022216796875, 4.184326171875, 4.4664306640625, 4.74853515625, 5.0306396484375, 5.312744140625, 5.5948486328125, 5.876953125, 6.1590576171875, 6.441162109375, 6.7232666015625, 7.00537109375, 7.2874755859375, 7.569580078125, 7.8516845703125, 8.1337890625, 8.4158935546875, 8.697998046875, 8.9801025390625, 9.26220703125, 9.5443115234375, 9.826416015625, 10.1085205078125, 10.390625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 14.0, 16.0, 25.0, 25.0, 33.0, 65.0, 78.0, 140.0, 228.0, 291.0, 494.0, 771.0, 1263.0, 1926.0, 3244.0, 5211.0, 8594.0, 14321.0, 23709.0, 39956.0, 66383.0, 110922.0, 169920.0, 200021.0, 155427.0, 98108.0, 58926.0, 35146.0, 20907.0, 12541.0, 7617.0, 4617.0, 2792.0, 1781.0, 1101.0, 709.0, 417.0, 276.0, 180.0, 119.0, 89.0, 47.0, 35.0, 20.0, 17.0, 7.0, 6.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.69921875, -0.6762008666992188, -0.6531829833984375, -0.6301651000976562, -0.607147216796875, -0.5841293334960938, -0.5611114501953125, -0.5380935668945312, -0.51507568359375, -0.49205780029296875, -0.4690399169921875, -0.44602203369140625, -0.423004150390625, -0.39998626708984375, -0.3769683837890625, -0.35395050048828125, -0.3309326171875, -0.30791473388671875, -0.2848968505859375, -0.26187896728515625, -0.238861083984375, -0.21584320068359375, -0.1928253173828125, -0.16980743408203125, -0.14678955078125, -0.12377166748046875, -0.1007537841796875, -0.07773590087890625, -0.054718017578125, -0.03170013427734375, -0.0086822509765625, 0.01433563232421875, 0.037353515625, 0.06037139892578125, 0.0833892822265625, 0.10640716552734375, 0.129425048828125, 0.15244293212890625, 0.1754608154296875, 0.19847869873046875, 0.22149658203125, 0.24451446533203125, 0.2675323486328125, 0.29055023193359375, 0.313568115234375, 0.33658599853515625, 0.3596038818359375, 0.38262176513671875, 0.4056396484375, 0.42865753173828125, 0.4516754150390625, 0.47469329833984375, 0.497711181640625, 0.5207290649414062, 0.5437469482421875, 0.5667648315429688, 0.58978271484375, 0.6128005981445312, 0.6358184814453125, 0.6588363647460938, 0.681854248046875, 0.7048721313476562, 0.7278900146484375, 0.7509078979492188, 0.77392578125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 4.0, 10.0, 6.0, 6.0, 13.0, 7.0, 9.0, 11.0, 17.0, 20.0, 22.0, 24.0, 21.0, 24.0, 30.0, 39.0, 35.0, 36.0, 35.0, 43.0, 39.0, 34.0, 1059.0, 33.0, 48.0, 29.0, 25.0, 42.0, 28.0, 30.0, 21.0, 21.0, 25.0, 25.0, 21.0, 17.0, 23.0, 17.0, 12.0, 9.0, 7.0, 13.0, 4.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.89453125, -4.7388916015625, -4.583251953125, -4.4276123046875, -4.27197265625, -4.1163330078125, -3.960693359375, -3.8050537109375, -3.6494140625, -3.4937744140625, -3.338134765625, -3.1824951171875, -3.02685546875, -2.8712158203125, -2.715576171875, -2.5599365234375, -2.404296875, -2.2486572265625, -2.093017578125, -1.9373779296875, -1.78173828125, -1.6260986328125, -1.470458984375, -1.3148193359375, -1.1591796875, -1.0035400390625, -0.847900390625, -0.6922607421875, -0.53662109375, -0.3809814453125, -0.225341796875, -0.0697021484375, 0.0859375, 0.2415771484375, 0.397216796875, 0.5528564453125, 0.70849609375, 0.8641357421875, 1.019775390625, 1.1754150390625, 1.3310546875, 1.4866943359375, 1.642333984375, 1.7979736328125, 1.95361328125, 2.1092529296875, 2.264892578125, 2.4205322265625, 2.576171875, 2.7318115234375, 2.887451171875, 3.0430908203125, 3.19873046875, 3.3543701171875, 3.510009765625, 3.6656494140625, 3.8212890625, 3.9769287109375, 4.132568359375, 4.2882080078125, 4.44384765625, 4.5994873046875, 4.755126953125, 4.9107666015625, 5.06640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 8.0, 14.0, 29.0, 31.0, 52.0, 62.0, 105.0, 140.0, 208.0, 349.0, 466.0, 775.0, 1184.0, 1804.0, 2818.0, 4558.0, 7284.0, 11733.0, 19077.0, 30787.0, 48858.0, 75388.0, 110795.0, 162844.0, 1189205.0, 142319.0, 101632.0, 68085.0, 43826.0, 27342.0, 16953.0, 10512.0, 6584.0, 3992.0, 2555.0, 1674.0, 1024.0, 673.0, 460.0, 313.0, 181.0, 138.0, 96.0, 59.0, 45.0, 32.0, 18.0, 11.0, 11.0, 2.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.47119140625, -0.4566383361816406, -0.44208526611328125, -0.4275321960449219, -0.4129791259765625, -0.3984260559082031, -0.38387298583984375, -0.3693199157714844, -0.354766845703125, -0.3402137756347656, -0.32566070556640625, -0.3111076354980469, -0.2965545654296875, -0.2820014953613281, -0.26744842529296875, -0.2528953552246094, -0.23834228515625, -0.22378921508789062, -0.20923614501953125, -0.19468307495117188, -0.1801300048828125, -0.16557693481445312, -0.15102386474609375, -0.13647079467773438, -0.121917724609375, -0.10736465454101562, -0.09281158447265625, -0.07825851440429688, -0.0637054443359375, -0.049152374267578125, -0.03459930419921875, -0.020046234130859375, -0.0054931640625, 0.009059906005859375, 0.02361297607421875, 0.038166046142578125, 0.0527191162109375, 0.06727218627929688, 0.08182525634765625, 0.09637832641601562, 0.110931396484375, 0.12548446655273438, 0.14003753662109375, 0.15459060668945312, 0.1691436767578125, 0.18369674682617188, 0.19824981689453125, 0.21280288696289062, 0.22735595703125, 0.24190902709960938, 0.25646209716796875, 0.2710151672363281, 0.2855682373046875, 0.3001213073730469, 0.31467437744140625, 0.3292274475097656, 0.343780517578125, 0.3583335876464844, 0.37288665771484375, 0.3874397277832031, 0.4019927978515625, 0.4165458679199219, 0.43109893798828125, 0.4456520080566406, 0.460205078125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 5.0, 1.0, 10.0, 11.0, 13.0, 11.0, 9.0, 15.0, 17.0, 28.0, 33.0, 32.0, 53.0, 68.0, 89.0, 79.0, 110.0, 95.0, 80.0, 44.0, 40.0, 31.0, 20.0, 22.0, 15.0, 17.0, 12.0, 11.0, 3.0, 3.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0199432373046875, -0.019369125366210938, -0.018795013427734375, -0.018220901489257812, -0.01764678955078125, -0.017072677612304688, -0.016498565673828125, -0.015924453735351562, -0.015350341796875, -0.014776229858398438, -0.014202117919921875, -0.013628005981445312, -0.01305389404296875, -0.012479782104492188, -0.011905670166015625, -0.011331558227539062, -0.0107574462890625, -0.010183334350585938, -0.009609222412109375, -0.009035110473632812, -0.00846099853515625, -0.007886886596679688, -0.007312774658203125, -0.0067386627197265625, -0.00616455078125, -0.0055904388427734375, -0.005016326904296875, -0.0044422149658203125, -0.00386810302734375, -0.0032939910888671875, -0.002719879150390625, -0.0021457672119140625, -0.0015716552734375, -0.0009975433349609375, -0.000423431396484375, 0.0001506805419921875, 0.00072479248046875, 0.0012989044189453125, 0.001873016357421875, 0.0024471282958984375, 0.003021240234375, 0.0035953521728515625, 0.004169464111328125, 0.0047435760498046875, 0.00531768798828125, 0.0058917999267578125, 0.006465911865234375, 0.0070400238037109375, 0.0076141357421875, 0.008188247680664062, 0.008762359619140625, 0.009336471557617188, 0.00991058349609375, 0.010484695434570312, 0.011058807373046875, 0.011632919311523438, 0.01220703125, 0.012781143188476562, 0.013355255126953125, 0.013929367065429688, 0.01450347900390625, 0.015077590942382812, 0.015651702880859375, 0.016225814819335938, 0.0167999267578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 11.0, 12.0, 22.0, 21.0, 29.0, 68.0, 75.0, 141.0, 205.0, 483.0, 4163.0, 990346.0, 51241.0, 988.0, 274.0, 151.0, 89.0, 59.0, 31.0, 35.0, 20.0, 14.0, 11.0, 11.0, 9.0, 6.0, 7.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3413047790527344, -0.32982635498046875, -0.3183479309082031, -0.3068695068359375, -0.2953910827636719, -0.28391265869140625, -0.2724342346191406, -0.260955810546875, -0.24947738647460938, -0.23799896240234375, -0.22652053833007812, -0.2150421142578125, -0.20356369018554688, -0.19208526611328125, -0.18060684204101562, -0.16912841796875, -0.15764999389648438, -0.14617156982421875, -0.13469314575195312, -0.1232147216796875, -0.11173629760742188, -0.10025787353515625, -0.08877944946289062, -0.077301025390625, -0.06582260131835938, -0.05434417724609375, -0.042865753173828125, -0.0313873291015625, -0.019908905029296875, -0.00843048095703125, 0.003047943115234375, 0.0145263671875, 0.026004791259765625, 0.03748321533203125, 0.048961639404296875, 0.0604400634765625, 0.07191848754882812, 0.08339691162109375, 0.09487533569335938, 0.106353759765625, 0.11783218383789062, 0.12931060791015625, 0.14078903198242188, 0.1522674560546875, 0.16374588012695312, 0.17522430419921875, 0.18670272827148438, 0.19818115234375, 0.20965957641601562, 0.22113800048828125, 0.23261642456054688, 0.2440948486328125, 0.2555732727050781, 0.26705169677734375, 0.2785301208496094, 0.290008544921875, 0.3014869689941406, 0.31296539306640625, 0.3244438171386719, 0.3359222412109375, 0.3474006652832031, 0.35887908935546875, 0.3703575134277344, 0.3818359375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 23.0, 71.0, 178.0, 305.0, 268.0, 117.0, 31.0, 11.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0532086119055748, -0.05221925675868988, -0.05122990161180496, -0.050240546464920044, -0.049251195043325424, -0.048261839896440506, -0.04727248474955559, -0.04628312960267067, -0.04529377445578575, -0.04430441930890083, -0.043315064162015915, -0.042325712740421295, -0.04133635759353638, -0.04034700244665146, -0.03935764729976654, -0.03836829215288162, -0.037378937005996704, -0.036389581859111786, -0.03540022671222687, -0.03441087156534195, -0.03342152014374733, -0.03243216499686241, -0.03144280984997749, -0.030453454703092575, -0.029464103281497955, -0.028474748134613037, -0.027485394850373268, -0.02649603970348835, -0.02550668455660343, -0.024517331272363663, -0.023527976125478745, -0.022538620978593826, -0.02154926396906376, -0.02055990882217884, -0.01957055553793907, -0.018581200391054153, -0.017591845244169235, -0.016602490097284317, -0.015613136813044548, -0.01462378166615963, -0.013634427450597286, -0.012645073235034943, -0.011655718088150024, -0.01066636387258768, -0.009677009657025337, -0.008687654510140419, -0.007698300294578075, -0.0067089456133544445, -0.005719590932130814, -0.004730236250907183, -0.0037408818025141954, -0.002751527354121208, -0.0017621726728975773, -0.0007728179916739464, 0.00021653622388839722, 0.0012058909051120281, 0.002195245586335659, 0.00318460026755929, 0.004173954948782921, 0.0051633091643452644, 0.006152663845568895, 0.007142018526792526, 0.00813137274235487, 0.009120726957917213, 0.010110082104802132]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 4.0, 2.0, 11.0, 10.0, 9.0, 16.0, 18.0, 17.0, 19.0, 34.0, 21.0, 32.0, 38.0, 38.0, 39.0, 45.0, 45.0, 36.0, 37.0, 45.0, 37.0, 41.0, 38.0, 42.0, 54.0, 33.0, 31.0, 27.0, 29.0, 18.0, 19.0, 20.0, 13.0, 10.0, 13.0, 9.0, 16.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007885932922363281, -0.007606863975524902, -0.0073277950286865234, -0.0070487260818481445, -0.006769657135009766, -0.006490588188171387, -0.006211519241333008, -0.005932450294494629, -0.00565338134765625, -0.005374312400817871, -0.005095243453979492, -0.004816174507141113, -0.004537105560302734, -0.0042580366134643555, -0.0039789676666259766, -0.0036998987197875977, -0.0034208297729492188, -0.00314176082611084, -0.002862691879272461, -0.002583622932434082, -0.002304553985595703, -0.0020254850387573242, -0.0017464160919189453, -0.0014673471450805664, -0.0011882781982421875, -0.0009092092514038086, -0.0006301403045654297, -0.0003510713577270508, -7.200241088867188e-05, 0.00020706653594970703, 0.00048613548278808594, 0.0007652044296264648, 0.0010442733764648438, 0.0013233423233032227, 0.0016024112701416016, 0.0018814802169799805, 0.0021605491638183594, 0.0024396181106567383, 0.002718687057495117, 0.002997756004333496, 0.003276824951171875, 0.003555893898010254, 0.003834962844848633, 0.004114031791687012, 0.004393100738525391, 0.0046721696853637695, 0.0049512386322021484, 0.005230307579040527, 0.005509376525878906, 0.005788445472717285, 0.006067514419555664, 0.006346583366394043, 0.006625652313232422, 0.006904721260070801, 0.00718379020690918, 0.007462859153747559, 0.0077419281005859375, 0.008020997047424316, 0.008300065994262695, 0.008579134941101074, 0.008858203887939453, 0.009137272834777832, 0.009416341781616211, 0.00969541072845459, 0.009974479675292969]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 4.0, 8.0, 5.0, 7.0, 10.0, 14.0, 12.0, 14.0, 19.0, 16.0, 16.0, 38.0, 34.0, 29.0, 33.0, 35.0, 44.0, 47.0, 47.0, 47.0, 55.0, 42.0, 42.0, 56.0, 30.0, 41.0, 45.0, 30.0, 21.0, 24.0, 33.0, 15.0, 12.0, 9.0, 15.0, 14.0, 3.0, 8.0, 9.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.3819580078125, -7.099853515625, -6.8177490234375, -6.53564453125, -6.2535400390625, -5.971435546875, -5.6893310546875, -5.4072265625, -5.1251220703125, -4.843017578125, -4.5609130859375, -4.27880859375, -3.9967041015625, -3.714599609375, -3.4324951171875, -3.150390625, -2.8682861328125, -2.586181640625, -2.3040771484375, -2.02197265625, -1.7398681640625, -1.457763671875, -1.1756591796875, -0.8935546875, -0.6114501953125, -0.329345703125, -0.0472412109375, 0.23486328125, 0.5169677734375, 0.799072265625, 1.0811767578125, 1.36328125, 1.6453857421875, 1.927490234375, 2.2095947265625, 2.49169921875, 2.7738037109375, 3.055908203125, 3.3380126953125, 3.6201171875, 3.9022216796875, 4.184326171875, 4.4664306640625, 4.74853515625, 5.0306396484375, 5.312744140625, 5.5948486328125, 5.876953125, 6.1590576171875, 6.441162109375, 6.7232666015625, 7.00537109375, 7.2874755859375, 7.569580078125, 7.8516845703125, 8.1337890625, 8.4158935546875, 8.697998046875, 8.9801025390625, 9.26220703125, 9.5443115234375, 9.826416015625, 10.1085205078125, 10.390625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 7.0, 8.0, 23.0, 25.0, 39.0, 69.0, 113.0, 171.0, 304.0, 607.0, 990.0, 1919.0, 3655.0, 6938.0, 14079.0, 30093.0, 70928.0, 212224.0, 449762.0, 152606.0, 55486.0, 24375.0, 11608.0, 5821.0, 2969.0, 1683.0, 918.0, 482.0, 274.0, 141.0, 99.0, 52.0, 31.0, 21.0, 13.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.63671875, -7.4078369140625, -7.178955078125, -6.9500732421875, -6.72119140625, -6.4923095703125, -6.263427734375, -6.0345458984375, -5.8056640625, -5.5767822265625, -5.347900390625, -5.1190185546875, -4.89013671875, -4.6612548828125, -4.432373046875, -4.2034912109375, -3.974609375, -3.7457275390625, -3.516845703125, -3.2879638671875, -3.05908203125, -2.8302001953125, -2.601318359375, -2.3724365234375, -2.1435546875, -1.9146728515625, -1.685791015625, -1.4569091796875, -1.22802734375, -0.9991455078125, -0.770263671875, -0.5413818359375, -0.3125, -0.0836181640625, 0.145263671875, 0.3741455078125, 0.60302734375, 0.8319091796875, 1.060791015625, 1.2896728515625, 1.5185546875, 1.7474365234375, 1.976318359375, 2.2052001953125, 2.43408203125, 2.6629638671875, 2.891845703125, 3.1207275390625, 3.349609375, 3.5784912109375, 3.807373046875, 4.0362548828125, 4.26513671875, 4.4940185546875, 4.722900390625, 4.9517822265625, 5.1806640625, 5.4095458984375, 5.638427734375, 5.8673095703125, 6.09619140625, 6.3250732421875, 6.553955078125, 6.7828369140625, 7.01171875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 5.0, 6.0, 9.0, 11.0, 9.0, 20.0, 21.0, 19.0, 25.0, 31.0, 26.0, 40.0, 50.0, 36.0, 58.0, 61.0, 96.0, 176.0, 1607.0, 174.0, 93.0, 67.0, 55.0, 52.0, 39.0, 35.0, 31.0, 32.0, 29.0, 26.0, 20.0, 17.0, 13.0, 11.0, 10.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -39.056396484375, -37.95654296875, -36.856689453125, -35.7568359375, -34.656982421875, -33.55712890625, -32.457275390625, -31.357421875, -30.257568359375, -29.15771484375, -28.057861328125, -26.9580078125, -25.858154296875, -24.75830078125, -23.658447265625, -22.55859375, -21.458740234375, -20.35888671875, -19.259033203125, -18.1591796875, -17.059326171875, -15.95947265625, -14.859619140625, -13.759765625, -12.659912109375, -11.56005859375, -10.460205078125, -9.3603515625, -8.260498046875, -7.16064453125, -6.060791015625, -4.9609375, -3.861083984375, -2.76123046875, -1.661376953125, -0.5615234375, 0.538330078125, 1.63818359375, 2.738037109375, 3.837890625, 4.937744140625, 6.03759765625, 7.137451171875, 8.2373046875, 9.337158203125, 10.43701171875, 11.536865234375, 12.63671875, 13.736572265625, 14.83642578125, 15.936279296875, 17.0361328125, 18.135986328125, 19.23583984375, 20.335693359375, 21.435546875, 22.535400390625, 23.63525390625, 24.735107421875, 25.8349609375, 26.934814453125, 28.03466796875, 29.134521484375, 30.234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 11.0, 29.0, 40.0, 58.0, 66.0, 159.0, 261.0, 678.0, 5032.0, 3117462.0, 20080.0, 1107.0, 305.0, 159.0, 100.0, 65.0, 28.0, 24.0, 9.0, 6.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.5, -118.490234375, -113.48046875, -108.470703125, -103.4609375, -98.451171875, -93.44140625, -88.431640625, -83.421875, -78.412109375, -73.40234375, -68.392578125, -63.3828125, -58.373046875, -53.36328125, -48.353515625, -43.34375, -38.333984375, -33.32421875, -28.314453125, -23.3046875, -18.294921875, -13.28515625, -8.275390625, -3.265625, 1.744140625, 6.75390625, 11.763671875, 16.7734375, 21.783203125, 26.79296875, 31.802734375, 36.8125, 41.822265625, 46.83203125, 51.841796875, 56.8515625, 61.861328125, 66.87109375, 71.880859375, 76.890625, 81.900390625, 86.91015625, 91.919921875, 96.9296875, 101.939453125, 106.94921875, 111.958984375, 116.96875, 121.978515625, 126.98828125, 131.998046875, 137.0078125, 142.017578125, 147.02734375, 152.037109375, 157.046875, 162.056640625, 167.06640625, 172.076171875, 177.0859375, 182.095703125, 187.10546875, 192.115234375, 197.125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 267.0, 750.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.93272399902344, -95.29681396484375, -64.66090393066406, -34.024986267089844, -3.3890762329101562, 27.246841430664062, 57.88275146484375, 88.51866149902344, 119.15457153320312, 149.7904815673828, 180.4263916015625, 211.06231689453125, 241.69821166992188, 272.3341369628906, 302.97003173828125, 333.60595703125, 364.24188232421875, 394.8778076171875, 425.5137023925781, 456.1496276855469, 486.7855224609375, 517.4214477539062, 548.057373046875, 578.6932373046875, 609.3291625976562, 639.965087890625, 670.6010131835938, 701.2368774414062, 731.872802734375, 762.5087280273438, 793.1446533203125, 823.780517578125, 854.4164428710938, 885.0523681640625, 915.6882934570312, 946.3241577148438, 976.9600830078125, 1007.5960083007812, 1038.23193359375, 1068.8677978515625, 1099.5037841796875, 1130.1396484375, 1160.775634765625, 1191.4114990234375, 1222.0474853515625, 1252.683349609375, 1283.3192138671875, 1313.9552001953125, 1344.591064453125, 1375.2269287109375, 1405.8629150390625, 1436.498779296875, 1467.134765625, 1497.7706298828125, 1528.406494140625, 1559.04248046875, 1589.6783447265625, 1620.314208984375, 1650.9501953125, 1681.5860595703125, 1712.2220458984375, 1742.85791015625, 1773.4937744140625, 1804.1297607421875, 1834.765625]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 9.0, 16.0, 11.0, 15.0, 11.0, 28.0, 31.0, 18.0, 23.0, 37.0, 27.0, 35.0, 42.0, 34.0, 56.0, 39.0, 41.0, 54.0, 57.0, 44.0, 46.0, 34.0, 20.0, 33.0, 37.0, 33.0, 24.0, 31.0, 18.0, 25.0, 14.0, 10.0, 3.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.95695495605469, -90.6125259399414, -87.2680892944336, -83.92366027832031, -80.57923126220703, -77.23479461669922, -73.89036560058594, -70.54592895507812, -67.20149993896484, -63.8570671081543, -60.512638092041016, -57.16820526123047, -53.82377243041992, -50.479339599609375, -47.134910583496094, -43.79047775268555, -40.446048736572266, -37.10161590576172, -33.75718688964844, -30.41275405883789, -27.068321228027344, -23.72389030456543, -20.379459381103516, -17.03502655029297, -13.690595626831055, -10.346163749694824, -7.001732349395752, -3.6573009490966797, -0.3128690719604492, 3.0315628051757812, 6.375993728637695, 9.720426559448242, 13.064857482910156, 16.40928840637207, 19.753721237182617, 23.09815216064453, 26.442584991455078, 29.787015914916992, 33.131446838378906, 36.47587966918945, 39.8203125, 43.16474533081055, 46.50917434692383, 49.853607177734375, 53.19804000854492, 56.54247283935547, 59.88690185546875, 63.2313346862793, 66.57575988769531, 69.9201889038086, 73.2646255493164, 76.60905456542969, 79.95348358154297, 83.29792022705078, 86.64234924316406, 89.98678588867188, 93.33121490478516, 96.67564392089844, 100.02008056640625, 103.36450958251953, 106.70893859863281, 110.05337524414062, 113.3978042602539, 116.74223327636719, 120.086669921875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 8.0, 6.0, 7.0, 13.0, 9.0, 15.0, 16.0, 16.0, 20.0, 16.0, 14.0, 30.0, 35.0, 29.0, 46.0, 40.0, 44.0, 60.0, 40.0, 54.0, 46.0, 44.0, 43.0, 43.0, 31.0, 37.0, 33.0, 23.0, 22.0, 31.0, 16.0, 23.0, 17.0, 17.0, 8.0, 11.0, 11.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.323974609375, -8.02294921875, -7.721923828125, -7.4208984375, -7.119873046875, -6.81884765625, -6.517822265625, -6.216796875, -5.915771484375, -5.61474609375, -5.313720703125, -5.0126953125, -4.711669921875, -4.41064453125, -4.109619140625, -3.80859375, -3.507568359375, -3.20654296875, -2.905517578125, -2.6044921875, -2.303466796875, -2.00244140625, -1.701416015625, -1.400390625, -1.099365234375, -0.79833984375, -0.497314453125, -0.1962890625, 0.104736328125, 0.40576171875, 0.706787109375, 1.0078125, 1.308837890625, 1.60986328125, 1.910888671875, 2.2119140625, 2.512939453125, 2.81396484375, 3.114990234375, 3.416015625, 3.717041015625, 4.01806640625, 4.319091796875, 4.6201171875, 4.921142578125, 5.22216796875, 5.523193359375, 5.82421875, 6.125244140625, 6.42626953125, 6.727294921875, 7.0283203125, 7.329345703125, 7.63037109375, 7.931396484375, 8.232421875, 8.533447265625, 8.83447265625, 9.135498046875, 9.4365234375, 9.737548828125, 10.03857421875, 10.339599609375, 10.640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 13.0, 34.0, 26.0, 58.0, 87.0, 116.0, 170.0, 257.0, 479.0, 831.0, 1591.0, 2904.0, 6503.0, 14813.0, 37871.0, 114134.0, 412305.0, 1196930.0, 1497602.0, 635409.0, 179768.0, 54715.0, 20439.0, 8590.0, 4056.0, 1984.0, 1026.0, 567.0, 357.0, 183.0, 134.0, 98.0, 54.0, 35.0, 30.0, 32.0, 15.0, 10.0, 10.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.1875, -11.8309326171875, -11.474365234375, -11.1177978515625, -10.76123046875, -10.4046630859375, -10.048095703125, -9.6915283203125, -9.3349609375, -8.9783935546875, -8.621826171875, -8.2652587890625, -7.90869140625, -7.5521240234375, -7.195556640625, -6.8389892578125, -6.482421875, -6.1258544921875, -5.769287109375, -5.4127197265625, -5.05615234375, -4.6995849609375, -4.343017578125, -3.9864501953125, -3.6298828125, -3.2733154296875, -2.916748046875, -2.5601806640625, -2.20361328125, -1.8470458984375, -1.490478515625, -1.1339111328125, -0.77734375, -0.4207763671875, -0.064208984375, 0.2923583984375, 0.64892578125, 1.0054931640625, 1.362060546875, 1.7186279296875, 2.0751953125, 2.4317626953125, 2.788330078125, 3.1448974609375, 3.50146484375, 3.8580322265625, 4.214599609375, 4.5711669921875, 4.927734375, 5.2843017578125, 5.640869140625, 5.9974365234375, 6.35400390625, 6.7105712890625, 7.067138671875, 7.4237060546875, 7.7802734375, 8.1368408203125, 8.493408203125, 8.8499755859375, 9.20654296875, 9.5631103515625, 9.919677734375, 10.2762451171875, 10.6328125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 18.0, 7.0, 26.0, 27.0, 36.0, 88.0, 110.0, 153.0, 264.0, 410.0, 528.0, 586.0, 573.0, 416.0, 276.0, 200.0, 117.0, 73.0, 46.0, 41.0, 27.0, 20.0, 10.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -18.85302734375, -18.0185546875, -17.18408203125, -16.349609375, -15.51513671875, -14.6806640625, -13.84619140625, -13.01171875, -12.17724609375, -11.3427734375, -10.50830078125, -9.673828125, -8.83935546875, -8.0048828125, -7.17041015625, -6.3359375, -5.50146484375, -4.6669921875, -3.83251953125, -2.998046875, -2.16357421875, -1.3291015625, -0.49462890625, 0.33984375, 1.17431640625, 2.0087890625, 2.84326171875, 3.677734375, 4.51220703125, 5.3466796875, 6.18115234375, 7.015625, 7.85009765625, 8.6845703125, 9.51904296875, 10.353515625, 11.18798828125, 12.0224609375, 12.85693359375, 13.69140625, 14.52587890625, 15.3603515625, 16.19482421875, 17.029296875, 17.86376953125, 18.6982421875, 19.53271484375, 20.3671875, 21.20166015625, 22.0361328125, 22.87060546875, 23.705078125, 24.53955078125, 25.3740234375, 26.20849609375, 27.04296875, 27.87744140625, 28.7119140625, 29.54638671875, 30.380859375, 31.21533203125, 32.0498046875, 32.88427734375, 33.71875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 9.0, 6.0, 11.0, 27.0, 24.0, 46.0, 52.0, 85.0, 83.0, 132.0, 196.0, 302.0, 647.0, 1998.0, 9695.0, 76845.0, 1108642.0, 2749020.0, 218930.0, 21747.0, 3593.0, 956.0, 443.0, 221.0, 179.0, 100.0, 76.0, 54.0, 37.0, 41.0, 28.0, 15.0, 10.0, 14.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.15625, -43.9091796875, -42.662109375, -41.4150390625, -40.16796875, -38.9208984375, -37.673828125, -36.4267578125, -35.1796875, -33.9326171875, -32.685546875, -31.4384765625, -30.19140625, -28.9443359375, -27.697265625, -26.4501953125, -25.203125, -23.9560546875, -22.708984375, -21.4619140625, -20.21484375, -18.9677734375, -17.720703125, -16.4736328125, -15.2265625, -13.9794921875, -12.732421875, -11.4853515625, -10.23828125, -8.9912109375, -7.744140625, -6.4970703125, -5.25, -4.0029296875, -2.755859375, -1.5087890625, -0.26171875, 0.9853515625, 2.232421875, 3.4794921875, 4.7265625, 5.9736328125, 7.220703125, 8.4677734375, 9.71484375, 10.9619140625, 12.208984375, 13.4560546875, 14.703125, 15.9501953125, 17.197265625, 18.4443359375, 19.69140625, 20.9384765625, 22.185546875, 23.4326171875, 24.6796875, 25.9267578125, 27.173828125, 28.4208984375, 29.66796875, 30.9150390625, 32.162109375, 33.4091796875, 34.65625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 18.0, 21.0, 44.0, 93.0, 114.0, 144.0, 160.0, 148.0, 121.0, 63.0, 34.0, 24.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.43276977539062, -154.79037475585938, -150.14797973632812, -145.50558471679688, -140.86318969726562, -136.22079467773438, -131.57839965820312, -126.93600463867188, -122.29360961914062, -117.65121459960938, -113.00881958007812, -108.36642456054688, -103.72402954101562, -99.08163452148438, -94.43923950195312, -89.79684448242188, -85.15444946289062, -80.51205444335938, -75.86965942382812, -71.22726440429688, -66.58486938476562, -61.942474365234375, -57.300079345703125, -52.657684326171875, -48.015289306640625, -43.372894287109375, -38.730499267578125, -34.088104248046875, -29.445709228515625, -24.803314208984375, -20.160919189453125, -15.518524169921875, -10.876113891601562, -6.2337188720703125, -1.5913238525390625, 3.0510711669921875, 7.6934661865234375, 12.335861206054688, 16.978256225585938, 21.620651245117188, 26.263046264648438, 30.905441284179688, 35.54783630371094, 40.19023132324219, 44.83262634277344, 49.47502136230469, 54.11741638183594, 58.75981140136719, 63.40220642089844, 68.04460144042969, 72.68699645996094, 77.32939147949219, 81.97178649902344, 86.61418151855469, 91.25657653808594, 95.89897155761719, 100.54136657714844, 105.18376159667969, 109.82615661621094, 114.46855163574219, 119.11094665527344, 123.75334167480469, 128.39573669433594, 133.0381317138672, 137.68052673339844]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 2.0, 8.0, 9.0, 16.0, 15.0, 15.0, 15.0, 24.0, 38.0, 40.0, 47.0, 43.0, 36.0, 38.0, 50.0, 50.0, 46.0, 49.0, 58.0, 42.0, 42.0, 46.0, 41.0, 39.0, 36.0, 26.0, 30.0, 15.0, 27.0, 22.0, 9.0, 3.0, 7.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.790191650390625, -59.394737243652344, -56.9992790222168, -54.603824615478516, -52.20836639404297, -49.81291198730469, -47.417457580566406, -45.022003173828125, -42.62654495239258, -40.2310905456543, -37.83563232421875, -35.44017791748047, -33.04472351074219, -30.64926528930664, -28.25381088256836, -25.858354568481445, -23.46289825439453, -21.067441940307617, -18.671985626220703, -16.276531219482422, -13.881074905395508, -11.485618591308594, -9.090163230895996, -6.694707870483398, -4.299251556396484, -1.9037957191467285, 0.49166011810302734, 2.887115955352783, 5.282571792602539, 7.678028106689453, 10.07348346710205, 12.468938827514648, 14.864395141601562, 17.259851455688477, 19.65530776977539, 22.050762176513672, 24.446218490600586, 26.8416748046875, 29.23712921142578, 31.632585525512695, 34.02804183959961, 36.42349624633789, 38.81895446777344, 41.21440887451172, 43.60986328125, 46.00532150268555, 48.40077590942383, 50.796234130859375, 53.191688537597656, 55.58714294433594, 57.982601165771484, 60.378055572509766, 62.77351379394531, 65.1689682006836, 67.56442260742188, 69.95987701416016, 72.35533142089844, 74.75078582763672, 77.146240234375, 79.54170227050781, 81.9371566772461, 84.33261108398438, 86.72806549072266, 89.12351989746094, 91.51898193359375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 6.0, 9.0, 10.0, 8.0, 15.0, 19.0, 9.0, 20.0, 18.0, 21.0, 26.0, 33.0, 34.0, 39.0, 42.0, 37.0, 53.0, 39.0, 34.0, 38.0, 61.0, 48.0, 37.0, 42.0, 51.0, 33.0, 25.0, 35.0, 26.0, 33.0, 15.0, 8.0, 19.0, 10.0, 7.0, 11.0, 8.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.4281005859375, -8.129638671875, -7.8311767578125, -7.53271484375, -7.2342529296875, -6.935791015625, -6.6373291015625, -6.3388671875, -6.0404052734375, -5.741943359375, -5.4434814453125, -5.14501953125, -4.8465576171875, -4.548095703125, -4.2496337890625, -3.951171875, -3.6527099609375, -3.354248046875, -3.0557861328125, -2.75732421875, -2.4588623046875, -2.160400390625, -1.8619384765625, -1.5634765625, -1.2650146484375, -0.966552734375, -0.6680908203125, -0.36962890625, -0.0711669921875, 0.227294921875, 0.5257568359375, 0.82421875, 1.1226806640625, 1.421142578125, 1.7196044921875, 2.01806640625, 2.3165283203125, 2.614990234375, 2.9134521484375, 3.2119140625, 3.5103759765625, 3.808837890625, 4.1072998046875, 4.40576171875, 4.7042236328125, 5.002685546875, 5.3011474609375, 5.599609375, 5.8980712890625, 6.196533203125, 6.4949951171875, 6.79345703125, 7.0919189453125, 7.390380859375, 7.6888427734375, 7.9873046875, 8.2857666015625, 8.584228515625, 8.8826904296875, 9.18115234375, 9.4796142578125, 9.778076171875, 10.0765380859375, 10.375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 1.0, 3.0, 8.0, 7.0, 17.0, 22.0, 29.0, 53.0, 58.0, 89.0, 125.0, 206.0, 275.0, 440.0, 577.0, 893.0, 1348.0, 1991.0, 2894.0, 4225.0, 6057.0, 9475.0, 13748.0, 20324.0, 29870.0, 44357.0, 64939.0, 94786.0, 130810.0, 154723.0, 139053.0, 103717.0, 72053.0, 49097.0, 32945.0, 22494.0, 15138.0, 10158.0, 6901.0, 4620.0, 3145.0, 2199.0, 1510.0, 1003.0, 695.0, 474.0, 314.0, 216.0, 151.0, 113.0, 61.0, 41.0, 45.0, 17.0, 25.0, 11.0, 5.0, 7.0, 2.0, 5.0, 2.0], "bins": [-0.63427734375, -0.614837646484375, -0.59539794921875, -0.575958251953125, -0.5565185546875, -0.537078857421875, -0.51763916015625, -0.498199462890625, -0.478759765625, -0.459320068359375, -0.43988037109375, -0.420440673828125, -0.4010009765625, -0.381561279296875, -0.36212158203125, -0.342681884765625, -0.3232421875, -0.303802490234375, -0.28436279296875, -0.264923095703125, -0.2454833984375, -0.226043701171875, -0.20660400390625, -0.187164306640625, -0.167724609375, -0.148284912109375, -0.12884521484375, -0.109405517578125, -0.0899658203125, -0.070526123046875, -0.05108642578125, -0.031646728515625, -0.01220703125, 0.007232666015625, 0.02667236328125, 0.046112060546875, 0.0655517578125, 0.084991455078125, 0.10443115234375, 0.123870849609375, 0.143310546875, 0.162750244140625, 0.18218994140625, 0.201629638671875, 0.2210693359375, 0.240509033203125, 0.25994873046875, 0.279388427734375, 0.298828125, 0.318267822265625, 0.33770751953125, 0.357147216796875, 0.3765869140625, 0.396026611328125, 0.41546630859375, 0.434906005859375, 0.454345703125, 0.473785400390625, 0.49322509765625, 0.512664794921875, 0.5321044921875, 0.551544189453125, 0.57098388671875, 0.590423583984375, 0.60986328125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 9.0, 8.0, 7.0, 9.0, 18.0, 14.0, 23.0, 27.0, 26.0, 41.0, 29.0, 46.0, 40.0, 36.0, 38.0, 51.0, 32.0, 1059.0, 44.0, 42.0, 42.0, 45.0, 39.0, 33.0, 40.0, 28.0, 26.0, 34.0, 20.0, 22.0, 22.0, 12.0, 13.0, 10.0, 14.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.71875, -6.53179931640625, -6.3448486328125, -6.15789794921875, -5.970947265625, -5.78399658203125, -5.5970458984375, -5.41009521484375, -5.22314453125, -5.03619384765625, -4.8492431640625, -4.66229248046875, -4.475341796875, -4.28839111328125, -4.1014404296875, -3.91448974609375, -3.7275390625, -3.54058837890625, -3.3536376953125, -3.16668701171875, -2.979736328125, -2.79278564453125, -2.6058349609375, -2.41888427734375, -2.23193359375, -2.04498291015625, -1.8580322265625, -1.67108154296875, -1.484130859375, -1.29718017578125, -1.1102294921875, -0.92327880859375, -0.736328125, -0.54937744140625, -0.3624267578125, -0.17547607421875, 0.011474609375, 0.19842529296875, 0.3853759765625, 0.57232666015625, 0.75927734375, 0.94622802734375, 1.1331787109375, 1.32012939453125, 1.507080078125, 1.69403076171875, 1.8809814453125, 2.06793212890625, 2.2548828125, 2.44183349609375, 2.6287841796875, 2.81573486328125, 3.002685546875, 3.18963623046875, 3.3765869140625, 3.56353759765625, 3.75048828125, 3.93743896484375, 4.1243896484375, 4.31134033203125, 4.498291015625, 4.68524169921875, 4.8721923828125, 5.05914306640625, 5.24609375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 16.0, 27.0, 38.0, 57.0, 92.0, 188.0, 294.0, 423.0, 792.0, 1450.0, 2352.0, 3917.0, 6674.0, 11205.0, 19251.0, 32316.0, 53299.0, 85624.0, 128299.0, 396966.0, 984090.0, 135279.0, 91720.0, 57649.0, 34869.0, 20749.0, 12139.0, 7271.0, 4145.0, 2406.0, 1449.0, 805.0, 493.0, 296.0, 206.0, 101.0, 66.0, 44.0, 23.0, 15.0, 6.0, 9.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.50732421875, -0.490997314453125, -0.47467041015625, -0.458343505859375, -0.4420166015625, -0.425689697265625, -0.40936279296875, -0.393035888671875, -0.376708984375, -0.360382080078125, -0.34405517578125, -0.327728271484375, -0.3114013671875, -0.295074462890625, -0.27874755859375, -0.262420654296875, -0.24609375, -0.229766845703125, -0.21343994140625, -0.197113037109375, -0.1807861328125, -0.164459228515625, -0.14813232421875, -0.131805419921875, -0.115478515625, -0.099151611328125, -0.08282470703125, -0.066497802734375, -0.0501708984375, -0.033843994140625, -0.01751708984375, -0.001190185546875, 0.01513671875, 0.031463623046875, 0.04779052734375, 0.064117431640625, 0.0804443359375, 0.096771240234375, 0.11309814453125, 0.129425048828125, 0.145751953125, 0.162078857421875, 0.17840576171875, 0.194732666015625, 0.2110595703125, 0.227386474609375, 0.24371337890625, 0.260040283203125, 0.2763671875, 0.292694091796875, 0.30902099609375, 0.325347900390625, 0.3416748046875, 0.358001708984375, 0.37432861328125, 0.390655517578125, 0.406982421875, 0.423309326171875, 0.43963623046875, 0.455963134765625, 0.4722900390625, 0.488616943359375, 0.50494384765625, 0.521270751953125, 0.53759765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 11.0, 14.0, 17.0, 15.0, 16.0, 23.0, 22.0, 32.0, 41.0, 39.0, 60.0, 69.0, 82.0, 105.0, 77.0, 72.0, 53.0, 39.0, 18.0, 29.0, 22.0, 20.0, 23.0, 11.0, 12.0, 7.0, 10.0, 10.0, 8.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0155792236328125, -0.015065908432006836, -0.014552593231201172, -0.014039278030395508, -0.013525962829589844, -0.01301264762878418, -0.012499332427978516, -0.011986017227172852, -0.011472702026367188, -0.010959386825561523, -0.01044607162475586, -0.009932756423950195, -0.009419441223144531, -0.008906126022338867, -0.008392810821533203, -0.007879495620727539, -0.007366180419921875, -0.006852865219116211, -0.006339550018310547, -0.005826234817504883, -0.005312919616699219, -0.004799604415893555, -0.004286289215087891, -0.0037729740142822266, -0.0032596588134765625, -0.0027463436126708984, -0.0022330284118652344, -0.0017197132110595703, -0.0012063980102539062, -0.0006930828094482422, -0.00017976760864257812, 0.00033354759216308594, 0.00084686279296875, 0.001360177993774414, 0.0018734931945800781, 0.002386808395385742, 0.0029001235961914062, 0.0034134387969970703, 0.003926753997802734, 0.0044400691986083984, 0.0049533843994140625, 0.0054666996002197266, 0.005980014801025391, 0.006493330001831055, 0.007006645202636719, 0.007519960403442383, 0.008033275604248047, 0.008546590805053711, 0.009059906005859375, 0.009573221206665039, 0.010086536407470703, 0.010599851608276367, 0.011113166809082031, 0.011626482009887695, 0.01213979721069336, 0.012653112411499023, 0.013166427612304688, 0.013679742813110352, 0.014193058013916016, 0.01470637321472168, 0.015219688415527344, 0.015733003616333008, 0.016246318817138672, 0.016759634017944336, 0.01727294921875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 9.0, 7.0, 12.0, 13.0, 16.0, 17.0, 17.0, 18.0, 31.0, 46.0, 65.0, 118.0, 225.0, 669.0, 8218.0, 899828.0, 135800.0, 2429.0, 441.0, 167.0, 98.0, 70.0, 41.0, 37.0, 15.0, 25.0, 24.0, 15.0, 3.0, 16.0, 8.0, 4.0, 5.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.339111328125, -0.3290824890136719, -0.31905364990234375, -0.3090248107910156, -0.2989959716796875, -0.2889671325683594, -0.27893829345703125, -0.2689094543457031, -0.258880615234375, -0.24885177612304688, -0.23882293701171875, -0.22879409790039062, -0.2187652587890625, -0.20873641967773438, -0.19870758056640625, -0.18867874145507812, -0.17864990234375, -0.16862106323242188, -0.15859222412109375, -0.14856338500976562, -0.1385345458984375, -0.12850570678710938, -0.11847686767578125, -0.10844802856445312, -0.098419189453125, -0.08839035034179688, -0.07836151123046875, -0.06833267211914062, -0.0583038330078125, -0.048274993896484375, -0.03824615478515625, -0.028217315673828125, -0.0181884765625, -0.008159637451171875, 0.00186920166015625, 0.011898040771484375, 0.0219268798828125, 0.031955718994140625, 0.04198455810546875, 0.052013397216796875, 0.062042236328125, 0.07207107543945312, 0.08209991455078125, 0.09212875366210938, 0.1021575927734375, 0.11218643188476562, 0.12221527099609375, 0.13224411010742188, 0.14227294921875, 0.15230178833007812, 0.16233062744140625, 0.17235946655273438, 0.1823883056640625, 0.19241714477539062, 0.20244598388671875, 0.21247482299804688, 0.222503662109375, 0.23253250122070312, 0.24256134033203125, 0.2525901794433594, 0.2626190185546875, 0.2726478576660156, 0.28267669677734375, 0.2927055358886719, 0.302734375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 26.0, 482.0, 483.0, 25.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018005209043622017, -0.014414839446544647, -0.010824470780789852, -0.007234102115035057, -0.0036437325179576874, -5.336292088031769e-05, 0.0035370048135519028, 0.0071273744106292725, 0.010717744007706642, 0.014308113604784012, 0.017898481339216232, 0.021488850936293602, 0.02507922053337097, 0.02866959013044834, 0.03225995600223541, 0.03585032746195793, 0.03944069892168045, 0.04303106665611267, 0.04662143811583519, 0.05021180585026741, 0.05380217730998993, 0.05739254504442215, 0.06098291277885437, 0.06457328051328659, 0.06816364824771881, 0.07175401598215103, 0.07534438371658325, 0.07893475890159607, 0.08252512663602829, 0.08611549437046051, 0.08970586210489273, 0.09329622983932495, 0.09688660502433777, 0.10047697275876999, 0.10406734049320221, 0.10765771567821503, 0.11124808341264725, 0.11483845114707947, 0.11842881888151169, 0.12201918661594391, 0.12560956180095673, 0.12919993698596954, 0.13279029726982117, 0.13638067245483398, 0.1399710327386856, 0.14356140792369843, 0.14715176820755005, 0.15074214339256287, 0.15433251857757568, 0.1579228937625885, 0.16151325404644012, 0.16510362923145294, 0.16869398951530457, 0.17228436470031738, 0.1758747398853302, 0.17946510016918182, 0.18305546045303345, 0.18664583563804626, 0.1902361959218979, 0.1938265711069107, 0.19741693139076233, 0.20100730657577515, 0.20459768176078796, 0.2081880420446396, 0.2117784172296524]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 17.0, 28.0, 23.0, 26.0, 25.0, 32.0, 45.0, 36.0, 55.0, 45.0, 61.0, 59.0, 54.0, 60.0, 54.0, 55.0, 57.0, 48.0, 37.0, 45.0, 31.0, 22.0, 12.0, 22.0, 17.0, 16.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013411343097686768, -0.012956619262695312, -0.012501895427703857, -0.012047171592712402, -0.011592447757720947, -0.011137723922729492, -0.010683000087738037, -0.010228276252746582, -0.009773552417755127, -0.009318828582763672, -0.008864104747772217, -0.008409380912780762, -0.007954657077789307, -0.0074999332427978516, -0.0070452094078063965, -0.006590485572814941, -0.006135761737823486, -0.005681037902832031, -0.005226314067840576, -0.004771590232849121, -0.004316866397857666, -0.003862142562866211, -0.003407418727874756, -0.0029526948928833008, -0.0024979710578918457, -0.0020432472229003906, -0.0015885233879089355, -0.0011337995529174805, -0.0006790757179260254, -0.0002243518829345703, 0.00023037195205688477, 0.0006850957870483398, 0.001139819622039795, 0.00159454345703125, 0.002049267292022705, 0.00250399112701416, 0.0029587149620056152, 0.0034134387969970703, 0.0038681626319885254, 0.0043228864669799805, 0.0047776103019714355, 0.005232334136962891, 0.005687057971954346, 0.006141781806945801, 0.006596505641937256, 0.007051229476928711, 0.007505953311920166, 0.007960677146911621, 0.008415400981903076, 0.008870124816894531, 0.009324848651885986, 0.009779572486877441, 0.010234296321868896, 0.010689020156860352, 0.011143743991851807, 0.011598467826843262, 0.012053191661834717, 0.012507915496826172, 0.012962639331817627, 0.013417363166809082, 0.013872087001800537, 0.014326810836791992, 0.014781534671783447, 0.015236258506774902, 0.015690982341766357]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 6.0, 9.0, 10.0, 8.0, 15.0, 19.0, 9.0, 20.0, 17.0, 22.0, 26.0, 33.0, 34.0, 39.0, 42.0, 37.0, 52.0, 40.0, 34.0, 38.0, 61.0, 48.0, 37.0, 42.0, 51.0, 33.0, 25.0, 35.0, 26.0, 33.0, 15.0, 8.0, 19.0, 10.0, 7.0, 11.0, 8.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.4281005859375, -8.129638671875, -7.8311767578125, -7.53271484375, -7.2342529296875, -6.935791015625, -6.6373291015625, -6.3388671875, -6.0404052734375, -5.741943359375, -5.4434814453125, -5.14501953125, -4.8465576171875, -4.548095703125, -4.2496337890625, -3.951171875, -3.6527099609375, -3.354248046875, -3.0557861328125, -2.75732421875, -2.4588623046875, -2.160400390625, -1.8619384765625, -1.5634765625, -1.2650146484375, -0.966552734375, -0.6680908203125, -0.36962890625, -0.0711669921875, 0.227294921875, 0.5257568359375, 0.82421875, 1.1226806640625, 1.421142578125, 1.7196044921875, 2.01806640625, 2.3165283203125, 2.614990234375, 2.9134521484375, 3.2119140625, 3.5103759765625, 3.808837890625, 4.1072998046875, 4.40576171875, 4.7042236328125, 5.002685546875, 5.3011474609375, 5.599609375, 5.8980712890625, 6.196533203125, 6.4949951171875, 6.79345703125, 7.0919189453125, 7.390380859375, 7.6888427734375, 7.9873046875, 8.2857666015625, 8.584228515625, 8.8826904296875, 9.18115234375, 9.4796142578125, 9.778076171875, 10.0765380859375, 10.375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 19.0, 27.0, 41.0, 64.0, 103.0, 183.0, 265.0, 419.0, 800.0, 1461.0, 2711.0, 5525.0, 12650.0, 30805.0, 84744.0, 283809.0, 422149.0, 126928.0, 43626.0, 17270.0, 7394.0, 3439.0, 1745.0, 950.0, 552.0, 331.0, 191.0, 121.0, 78.0, 44.0, 31.0, 22.0, 16.0, 11.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.9140625, -8.65325927734375, -8.3924560546875, -8.13165283203125, -7.870849609375, -7.61004638671875, -7.3492431640625, -7.08843994140625, -6.82763671875, -6.56683349609375, -6.3060302734375, -6.04522705078125, -5.784423828125, -5.52362060546875, -5.2628173828125, -5.00201416015625, -4.7412109375, -4.48040771484375, -4.2196044921875, -3.95880126953125, -3.697998046875, -3.43719482421875, -3.1763916015625, -2.91558837890625, -2.65478515625, -2.39398193359375, -2.1331787109375, -1.87237548828125, -1.611572265625, -1.35076904296875, -1.0899658203125, -0.82916259765625, -0.568359375, -0.30755615234375, -0.0467529296875, 0.21405029296875, 0.474853515625, 0.73565673828125, 0.9964599609375, 1.25726318359375, 1.51806640625, 1.77886962890625, 2.0396728515625, 2.30047607421875, 2.561279296875, 2.82208251953125, 3.0828857421875, 3.34368896484375, 3.6044921875, 3.86529541015625, 4.1260986328125, 4.38690185546875, 4.647705078125, 4.90850830078125, 5.1693115234375, 5.43011474609375, 5.69091796875, 5.95172119140625, 6.2125244140625, 6.47332763671875, 6.734130859375, 6.99493408203125, 7.2557373046875, 7.51654052734375, 7.77734375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 3.0, 13.0, 11.0, 17.0, 14.0, 15.0, 31.0, 38.0, 35.0, 32.0, 55.0, 67.0, 71.0, 132.0, 1641.0, 346.0, 110.0, 64.0, 67.0, 40.0, 38.0, 44.0, 28.0, 26.0, 27.0, 11.0, 18.0, 15.0, 8.0, 5.0, 6.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.75, -48.32275390625, -46.8955078125, -45.46826171875, -44.041015625, -42.61376953125, -41.1865234375, -39.75927734375, -38.33203125, -36.90478515625, -35.4775390625, -34.05029296875, -32.623046875, -31.19580078125, -29.7685546875, -28.34130859375, -26.9140625, -25.48681640625, -24.0595703125, -22.63232421875, -21.205078125, -19.77783203125, -18.3505859375, -16.92333984375, -15.49609375, -14.06884765625, -12.6416015625, -11.21435546875, -9.787109375, -8.35986328125, -6.9326171875, -5.50537109375, -4.078125, -2.65087890625, -1.2236328125, 0.20361328125, 1.630859375, 3.05810546875, 4.4853515625, 5.91259765625, 7.33984375, 8.76708984375, 10.1943359375, 11.62158203125, 13.048828125, 14.47607421875, 15.9033203125, 17.33056640625, 18.7578125, 20.18505859375, 21.6123046875, 23.03955078125, 24.466796875, 25.89404296875, 27.3212890625, 28.74853515625, 30.17578125, 31.60302734375, 33.0302734375, 34.45751953125, 35.884765625, 37.31201171875, 38.7392578125, 40.16650390625, 41.59375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 10.0, 6.0, 9.0, 11.0, 23.0, 20.0, 35.0, 43.0, 64.0, 77.0, 136.0, 131.0, 224.0, 454.0, 1288.0, 63494.0, 3072843.0, 5184.0, 665.0, 317.0, 206.0, 110.0, 95.0, 78.0, 58.0, 25.0, 25.0, 22.0, 14.0, 11.0, 7.0, 9.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -90.4853515625, -87.283203125, -84.0810546875, -80.87890625, -77.6767578125, -74.474609375, -71.2724609375, -68.0703125, -64.8681640625, -61.666015625, -58.4638671875, -55.26171875, -52.0595703125, -48.857421875, -45.6552734375, -42.453125, -39.2509765625, -36.048828125, -32.8466796875, -29.64453125, -26.4423828125, -23.240234375, -20.0380859375, -16.8359375, -13.6337890625, -10.431640625, -7.2294921875, -4.02734375, -0.8251953125, 2.376953125, 5.5791015625, 8.78125, 11.9833984375, 15.185546875, 18.3876953125, 21.58984375, 24.7919921875, 27.994140625, 31.1962890625, 34.3984375, 37.6005859375, 40.802734375, 44.0048828125, 47.20703125, 50.4091796875, 53.611328125, 56.8134765625, 60.015625, 63.2177734375, 66.419921875, 69.6220703125, 72.82421875, 76.0263671875, 79.228515625, 82.4306640625, 85.6328125, 88.8349609375, 92.037109375, 95.2392578125, 98.44140625, 101.6435546875, 104.845703125, 108.0478515625, 111.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 29.0, 146.0, 385.0, 337.0, 104.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.38636779785156, -210.08706665039062, -205.78775024414062, -201.4884490966797, -197.1891326904297, -192.88983154296875, -188.59051513671875, -184.2912139892578, -179.9918975830078, -175.69259643554688, -171.39328002929688, -167.09397888183594, -162.79466247558594, -158.495361328125, -154.196044921875, -149.89674377441406, -145.59744262695312, -141.2981414794922, -136.9988250732422, -132.69952392578125, -128.40020751953125, -124.10089874267578, -119.80158996582031, -115.50228881835938, -111.20297241210938, -106.9036636352539, -102.60435485839844, -98.30504608154297, -94.0057373046875, -89.70642852783203, -85.40711975097656, -81.10781860351562, -76.80850982666016, -72.50920104980469, -68.20989227294922, -63.91058349609375, -59.61127471923828, -55.31196594238281, -51.01266098022461, -46.71335220336914, -42.41404342651367, -38.1147346496582, -33.815425872802734, -29.5161190032959, -25.21681022644043, -20.91750144958496, -16.618194580078125, -12.318885803222656, -8.019577026367188, -3.720268726348877, 0.5790395736694336, 4.878347396850586, 9.177656173706055, 13.476964950561523, 17.77627182006836, 22.075580596923828, 26.374889373779297, 30.674198150634766, 34.973506927490234, 39.27281188964844, 43.572120666503906, 47.871429443359375, 52.170738220214844, 56.47004699707031, 60.76935577392578]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 3.0, 9.0, 5.0, 7.0, 13.0, 13.0, 15.0, 17.0, 12.0, 23.0, 15.0, 24.0, 20.0, 29.0, 34.0, 40.0, 24.0, 34.0, 49.0, 42.0, 55.0, 40.0, 44.0, 30.0, 35.0, 30.0, 40.0, 25.0, 28.0, 33.0, 31.0, 24.0, 20.0, 16.0, 18.0, 19.0, 8.0, 6.0, 13.0, 10.0, 8.0, 8.0, 8.0, 6.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-75.65803527832031, -73.16386413574219, -70.6697006225586, -68.175537109375, -65.68136596679688, -63.187198638916016, -60.693031311035156, -58.1988639831543, -55.70469665527344, -53.21052932739258, -50.71636199951172, -48.22219467163086, -45.72802734375, -43.23386001586914, -40.73969268798828, -38.24552536010742, -35.75135803222656, -33.2571907043457, -30.763023376464844, -28.268856048583984, -25.774688720703125, -23.280521392822266, -20.786354064941406, -18.292186737060547, -15.798019409179688, -13.303852081298828, -10.809684753417969, -8.31551742553711, -5.82135009765625, -3.3271827697753906, -0.8330154418945312, 1.6611518859863281, 4.155311584472656, 6.649478912353516, 9.143646240234375, 11.637813568115234, 14.131980895996094, 16.626148223876953, 19.120315551757812, 21.614482879638672, 24.10865020751953, 26.60281753540039, 29.09698486328125, 31.59115219116211, 34.08531951904297, 36.57948684692383, 39.07365417480469, 41.56782150268555, 44.061988830566406, 46.556156158447266, 49.050323486328125, 51.544490814208984, 54.038658142089844, 56.5328254699707, 59.02699279785156, 61.52116012573242, 64.01532745361328, 66.50949096679688, 69.003662109375, 71.49783325195312, 73.99199676513672, 76.48616027832031, 78.98033142089844, 81.47450256347656, 83.96866607666016]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 7.0, 9.0, 11.0, 6.0, 7.0, 11.0, 23.0, 17.0, 15.0, 15.0, 21.0, 30.0, 24.0, 28.0, 43.0, 42.0, 42.0, 36.0, 41.0, 43.0, 36.0, 42.0, 54.0, 36.0, 46.0, 46.0, 35.0, 32.0, 19.0, 32.0, 26.0, 29.0, 16.0, 13.0, 15.0, 9.0, 8.0, 7.0, 7.0, 7.0, 6.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2406005859375, -7.942138671875, -7.6436767578125, -7.34521484375, -7.0467529296875, -6.748291015625, -6.4498291015625, -6.1513671875, -5.8529052734375, -5.554443359375, -5.2559814453125, -4.95751953125, -4.6590576171875, -4.360595703125, -4.0621337890625, -3.763671875, -3.4652099609375, -3.166748046875, -2.8682861328125, -2.56982421875, -2.2713623046875, -1.972900390625, -1.6744384765625, -1.3759765625, -1.0775146484375, -0.779052734375, -0.4805908203125, -0.18212890625, 0.1163330078125, 0.414794921875, 0.7132568359375, 1.01171875, 1.3101806640625, 1.608642578125, 1.9071044921875, 2.20556640625, 2.5040283203125, 2.802490234375, 3.1009521484375, 3.3994140625, 3.6978759765625, 3.996337890625, 4.2947998046875, 4.59326171875, 4.8917236328125, 5.190185546875, 5.4886474609375, 5.787109375, 6.0855712890625, 6.384033203125, 6.6824951171875, 6.98095703125, 7.2794189453125, 7.577880859375, 7.8763427734375, 8.1748046875, 8.4732666015625, 8.771728515625, 9.0701904296875, 9.36865234375, 9.6671142578125, 9.965576171875, 10.2640380859375, 10.5625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 4.0, 9.0, 14.0, 17.0, 19.0, 18.0, 19.0, 26.0, 30.0, 36.0, 50.0, 107.0, 214.0, 534.0, 2474.0, 25353.0, 856934.0, 3161951.0, 136867.0, 7669.0, 1141.0, 321.0, 126.0, 85.0, 43.0, 26.0, 26.0, 24.0, 24.0, 19.0, 19.0, 12.0, 5.0, 11.0, 7.0, 3.0, 5.0, 6.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.984375, -37.8125, -36.640625, -35.46875, -34.296875, -33.125, -31.953125, -30.78125, -29.609375, -28.4375, -27.265625, -26.09375, -24.921875, -23.75, -22.578125, -21.40625, -20.234375, -19.0625, -17.890625, -16.71875, -15.546875, -14.375, -13.203125, -12.03125, -10.859375, -9.6875, -8.515625, -7.34375, -6.171875, -5.0, -3.828125, -2.65625, -1.484375, -0.3125, 0.859375, 2.03125, 3.203125, 4.375, 5.546875, 6.71875, 7.890625, 9.0625, 10.234375, 11.40625, 12.578125, 13.75, 14.921875, 16.09375, 17.265625, 18.4375, 19.609375, 20.78125, 21.953125, 23.125, 24.296875, 25.46875, 26.640625, 27.8125, 28.984375, 30.15625, 31.328125, 32.5, 33.671875, 34.84375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 14.0, 22.0, 30.0, 39.0, 75.0, 96.0, 132.0, 193.0, 269.0, 378.0, 521.0, 544.0, 489.0, 364.0, 284.0, 171.0, 138.0, 98.0, 64.0, 40.0, 32.0, 24.0, 18.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.3125, -25.5908203125, -24.869140625, -24.1474609375, -23.42578125, -22.7041015625, -21.982421875, -21.2607421875, -20.5390625, -19.8173828125, -19.095703125, -18.3740234375, -17.65234375, -16.9306640625, -16.208984375, -15.4873046875, -14.765625, -14.0439453125, -13.322265625, -12.6005859375, -11.87890625, -11.1572265625, -10.435546875, -9.7138671875, -8.9921875, -8.2705078125, -7.548828125, -6.8271484375, -6.10546875, -5.3837890625, -4.662109375, -3.9404296875, -3.21875, -2.4970703125, -1.775390625, -1.0537109375, -0.33203125, 0.3896484375, 1.111328125, 1.8330078125, 2.5546875, 3.2763671875, 3.998046875, 4.7197265625, 5.44140625, 6.1630859375, 6.884765625, 7.6064453125, 8.328125, 9.0498046875, 9.771484375, 10.4931640625, 11.21484375, 11.9365234375, 12.658203125, 13.3798828125, 14.1015625, 14.8232421875, 15.544921875, 16.2666015625, 16.98828125, 17.7099609375, 18.431640625, 19.1533203125, 19.875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 2.0, 3.0, 5.0, 9.0, 14.0, 16.0, 31.0, 33.0, 47.0, 60.0, 89.0, 113.0, 198.0, 350.0, 690.0, 1932.0, 10605.0, 171042.0, 3138810.0, 829476.0, 34835.0, 3725.0, 982.0, 434.0, 223.0, 163.0, 111.0, 81.0, 60.0, 38.0, 32.0, 16.0, 16.0, 10.0, 8.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.5986328125, -39.134765625, -37.6708984375, -36.20703125, -34.7431640625, -33.279296875, -31.8154296875, -30.3515625, -28.8876953125, -27.423828125, -25.9599609375, -24.49609375, -23.0322265625, -21.568359375, -20.1044921875, -18.640625, -17.1767578125, -15.712890625, -14.2490234375, -12.78515625, -11.3212890625, -9.857421875, -8.3935546875, -6.9296875, -5.4658203125, -4.001953125, -2.5380859375, -1.07421875, 0.3896484375, 1.853515625, 3.3173828125, 4.78125, 6.2451171875, 7.708984375, 9.1728515625, 10.63671875, 12.1005859375, 13.564453125, 15.0283203125, 16.4921875, 17.9560546875, 19.419921875, 20.8837890625, 22.34765625, 23.8115234375, 25.275390625, 26.7392578125, 28.203125, 29.6669921875, 31.130859375, 32.5947265625, 34.05859375, 35.5224609375, 36.986328125, 38.4501953125, 39.9140625, 41.3779296875, 42.841796875, 44.3056640625, 45.76953125, 47.2333984375, 48.697265625, 50.1611328125, 51.625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 9.0, 16.0, 31.0, 30.0, 58.0, 71.0, 81.0, 108.0, 118.0, 121.0, 99.0, 86.0, 61.0, 50.0, 24.0, 19.0, 10.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.73302459716797, -94.63463592529297, -91.53624725341797, -88.4378662109375, -85.3394775390625, -82.2410888671875, -79.1427001953125, -76.0443115234375, -72.9459228515625, -69.8475341796875, -66.7491455078125, -63.650760650634766, -60.55237579345703, -57.45398712158203, -54.35559844970703, -51.25720977783203, -48.15882873535156, -45.06044006347656, -41.96205520629883, -38.86366653442383, -35.765281677246094, -32.666893005371094, -29.568504333496094, -26.470117568969727, -23.37173080444336, -20.273344039916992, -17.174957275390625, -14.076568603515625, -10.978181838989258, -7.879795074462891, -4.781406402587891, -1.6830196380615234, 1.4153594970703125, 4.513746738433838, 7.612133979797363, 10.710521697998047, 13.808908462524414, 16.90729522705078, 20.00568389892578, 23.10407066345215, 26.202457427978516, 29.300844192504883, 32.39923095703125, 35.49761962890625, 38.59600830078125, 41.694393157958984, 44.792781829833984, 47.89116668701172, 50.98955535888672, 54.08794403076172, 57.18632888793945, 60.28471755981445, 63.38310241699219, 66.48149108886719, 69.57987976074219, 72.67826843261719, 75.77665710449219, 78.87504577636719, 81.97343444824219, 85.07182312011719, 88.17020416259766, 91.26859283447266, 94.36698150634766, 97.46537017822266, 100.56375122070312]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 11.0, 13.0, 10.0, 17.0, 21.0, 18.0, 22.0, 21.0, 11.0, 27.0, 38.0, 39.0, 33.0, 41.0, 34.0, 37.0, 43.0, 42.0, 51.0, 40.0, 45.0, 24.0, 36.0, 42.0, 38.0, 39.0, 30.0, 18.0, 24.0, 19.0, 18.0, 15.0, 17.0, 8.0, 9.0, 11.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-57.74072265625, -55.865501403808594, -53.99028015136719, -52.11505889892578, -50.239837646484375, -48.36461639404297, -46.48939514160156, -44.614173889160156, -42.73895263671875, -40.863731384277344, -38.98851013183594, -37.11328887939453, -35.238067626953125, -33.36284637451172, -31.487625122070312, -29.612403869628906, -27.7371826171875, -25.861961364746094, -23.986740112304688, -22.11151885986328, -20.236297607421875, -18.36107635498047, -16.485855102539062, -14.610633850097656, -12.73541259765625, -10.860191345214844, -8.984970092773438, -7.109748840332031, -5.234527587890625, -3.3593063354492188, -1.4840850830078125, 0.39113616943359375, 2.266357421875, 4.141578674316406, 6.0167999267578125, 7.892021179199219, 9.767242431640625, 11.642463684082031, 13.517684936523438, 15.392906188964844, 17.26812744140625, 19.143348693847656, 21.018569946289062, 22.89379119873047, 24.769012451171875, 26.64423370361328, 28.519454956054688, 30.394676208496094, 32.2698974609375, 34.145118713378906, 36.02033996582031, 37.89556121826172, 39.770782470703125, 41.64600372314453, 43.52122497558594, 45.396446228027344, 47.27166748046875, 49.146888732910156, 51.02210998535156, 52.89733123779297, 54.772552490234375, 56.64777374267578, 58.52299499511719, 60.398216247558594, 62.2734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 4.0, 8.0, 12.0, 16.0, 8.0, 19.0, 16.0, 14.0, 23.0, 25.0, 21.0, 32.0, 28.0, 29.0, 39.0, 30.0, 31.0, 35.0, 46.0, 37.0, 32.0, 38.0, 31.0, 39.0, 42.0, 38.0, 31.0, 39.0, 25.0, 29.0, 24.0, 20.0, 16.0, 12.0, 19.0, 14.0, 13.0, 2.0, 8.0, 6.0, 8.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8515625, -7.592041015625, -7.33251953125, -7.072998046875, -6.8134765625, -6.553955078125, -6.29443359375, -6.034912109375, -5.775390625, -5.515869140625, -5.25634765625, -4.996826171875, -4.7373046875, -4.477783203125, -4.21826171875, -3.958740234375, -3.69921875, -3.439697265625, -3.18017578125, -2.920654296875, -2.6611328125, -2.401611328125, -2.14208984375, -1.882568359375, -1.623046875, -1.363525390625, -1.10400390625, -0.844482421875, -0.5849609375, -0.325439453125, -0.06591796875, 0.193603515625, 0.453125, 0.712646484375, 0.97216796875, 1.231689453125, 1.4912109375, 1.750732421875, 2.01025390625, 2.269775390625, 2.529296875, 2.788818359375, 3.04833984375, 3.307861328125, 3.5673828125, 3.826904296875, 4.08642578125, 4.345947265625, 4.60546875, 4.864990234375, 5.12451171875, 5.384033203125, 5.6435546875, 5.903076171875, 6.16259765625, 6.422119140625, 6.681640625, 6.941162109375, 7.20068359375, 7.460205078125, 7.7197265625, 7.979248046875, 8.23876953125, 8.498291015625, 8.7578125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 6.0, 11.0, 15.0, 19.0, 38.0, 50.0, 78.0, 132.0, 178.0, 207.0, 397.0, 512.0, 725.0, 1023.0, 1550.0, 2104.0, 3060.0, 4386.0, 6306.0, 9110.0, 13149.0, 19396.0, 28282.0, 41670.0, 61046.0, 89038.0, 123889.0, 153194.0, 142285.0, 108273.0, 75224.0, 51640.0, 35003.0, 23787.0, 16223.0, 11062.0, 7784.0, 5352.0, 3737.0, 2600.0, 1834.0, 1341.0, 890.0, 576.0, 440.0, 364.0, 190.0, 133.0, 81.0, 51.0, 27.0, 31.0, 15.0, 21.0, 6.0, 9.0, 8.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.60107421875, -0.58154296875, -0.56201171875, -0.54248046875, -0.52294921875, -0.50341796875, -0.48388671875, -0.46435546875, -0.44482421875, -0.42529296875, -0.40576171875, -0.38623046875, -0.36669921875, -0.34716796875, -0.32763671875, -0.30810546875, -0.28857421875, -0.26904296875, -0.24951171875, -0.22998046875, -0.21044921875, -0.19091796875, -0.17138671875, -0.15185546875, -0.13232421875, -0.11279296875, -0.09326171875, -0.07373046875, -0.05419921875, -0.03466796875, -0.01513671875, 0.00439453125, 0.02392578125, 0.04345703125, 0.06298828125, 0.08251953125, 0.10205078125, 0.12158203125, 0.14111328125, 0.16064453125, 0.18017578125, 0.19970703125, 0.21923828125, 0.23876953125, 0.25830078125, 0.27783203125, 0.29736328125, 0.31689453125, 0.33642578125, 0.35595703125, 0.37548828125, 0.39501953125, 0.41455078125, 0.43408203125, 0.45361328125, 0.47314453125, 0.49267578125, 0.51220703125, 0.53173828125, 0.55126953125, 0.57080078125, 0.59033203125, 0.60986328125, 0.62939453125, 0.64892578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 7.0, 9.0, 8.0, 6.0, 13.0, 11.0, 13.0, 23.0, 17.0, 24.0, 24.0, 26.0, 30.0, 32.0, 31.0, 48.0, 37.0, 44.0, 43.0, 35.0, 55.0, 1069.0, 43.0, 37.0, 32.0, 35.0, 38.0, 24.0, 24.0, 18.0, 29.0, 24.0, 20.0, 16.0, 14.0, 15.0, 6.0, 8.0, 3.0, 5.0, 6.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.953125, -5.77301025390625, -5.5928955078125, -5.41278076171875, -5.232666015625, -5.05255126953125, -4.8724365234375, -4.69232177734375, -4.51220703125, -4.33209228515625, -4.1519775390625, -3.97186279296875, -3.791748046875, -3.61163330078125, -3.4315185546875, -3.25140380859375, -3.0712890625, -2.89117431640625, -2.7110595703125, -2.53094482421875, -2.350830078125, -2.17071533203125, -1.9906005859375, -1.81048583984375, -1.63037109375, -1.45025634765625, -1.2701416015625, -1.09002685546875, -0.909912109375, -0.72979736328125, -0.5496826171875, -0.36956787109375, -0.189453125, -0.00933837890625, 0.1707763671875, 0.35089111328125, 0.531005859375, 0.71112060546875, 0.8912353515625, 1.07135009765625, 1.25146484375, 1.43157958984375, 1.6116943359375, 1.79180908203125, 1.971923828125, 2.15203857421875, 2.3321533203125, 2.51226806640625, 2.6923828125, 2.87249755859375, 3.0526123046875, 3.23272705078125, 3.412841796875, 3.59295654296875, 3.7730712890625, 3.95318603515625, 4.13330078125, 4.31341552734375, 4.4935302734375, 4.67364501953125, 4.853759765625, 5.03387451171875, 5.2139892578125, 5.39410400390625, 5.57421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 8.0, 10.0, 20.0, 16.0, 21.0, 38.0, 48.0, 70.0, 98.0, 147.0, 226.0, 349.0, 485.0, 812.0, 1249.0, 1883.0, 2776.0, 4137.0, 6624.0, 10130.0, 15759.0, 24299.0, 37311.0, 57233.0, 83667.0, 117395.0, 326961.0, 1005747.0, 127258.0, 91139.0, 62533.0, 41448.0, 26951.0, 17462.0, 11507.0, 7389.0, 4812.0, 3086.0, 2014.0, 1360.0, 912.0, 566.0, 407.0, 253.0, 158.0, 121.0, 83.0, 52.0, 45.0, 28.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.4091796875, -0.3951263427734375, -0.381072998046875, -0.3670196533203125, -0.35296630859375, -0.3389129638671875, -0.324859619140625, -0.3108062744140625, -0.2967529296875, -0.2826995849609375, -0.268646240234375, -0.2545928955078125, -0.24053955078125, -0.2264862060546875, -0.212432861328125, -0.1983795166015625, -0.184326171875, -0.1702728271484375, -0.156219482421875, -0.1421661376953125, -0.12811279296875, -0.1140594482421875, -0.100006103515625, -0.0859527587890625, -0.0718994140625, -0.0578460693359375, -0.043792724609375, -0.0297393798828125, -0.01568603515625, -0.0016326904296875, 0.012420654296875, 0.0264739990234375, 0.04052734375, 0.0545806884765625, 0.068634033203125, 0.0826873779296875, 0.09674072265625, 0.1107940673828125, 0.124847412109375, 0.1389007568359375, 0.1529541015625, 0.1670074462890625, 0.181060791015625, 0.1951141357421875, 0.20916748046875, 0.2232208251953125, 0.237274169921875, 0.2513275146484375, 0.265380859375, 0.2794342041015625, 0.293487548828125, 0.3075408935546875, 0.32159423828125, 0.3356475830078125, 0.349700927734375, 0.3637542724609375, 0.3778076171875, 0.3918609619140625, 0.405914306640625, 0.4199676513671875, 0.43402099609375, 0.4480743408203125, 0.462127685546875, 0.4761810302734375, 0.490234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 3.0, 12.0, 15.0, 14.0, 19.0, 29.0, 35.0, 25.0, 45.0, 35.0, 67.0, 65.0, 71.0, 101.0, 80.0, 56.0, 60.0, 47.0, 41.0, 28.0, 28.0, 19.0, 19.0, 12.0, 7.0, 9.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.020751953125, -0.02011251449584961, -0.01947307586669922, -0.018833637237548828, -0.018194198608398438, -0.017554759979248047, -0.016915321350097656, -0.016275882720947266, -0.015636444091796875, -0.014997005462646484, -0.014357566833496094, -0.013718128204345703, -0.013078689575195312, -0.012439250946044922, -0.011799812316894531, -0.01116037368774414, -0.01052093505859375, -0.00988149642944336, -0.009242057800292969, -0.008602619171142578, -0.007963180541992188, -0.007323741912841797, -0.006684303283691406, -0.006044864654541016, -0.005405426025390625, -0.004765987396240234, -0.004126548767089844, -0.003487110137939453, -0.0028476715087890625, -0.002208232879638672, -0.0015687942504882812, -0.0009293556213378906, -0.0002899169921875, 0.0003495216369628906, 0.0009889602661132812, 0.0016283988952636719, 0.0022678375244140625, 0.002907276153564453, 0.0035467147827148438, 0.004186153411865234, 0.004825592041015625, 0.005465030670166016, 0.006104469299316406, 0.006743907928466797, 0.0073833465576171875, 0.008022785186767578, 0.008662223815917969, 0.00930166244506836, 0.00994110107421875, 0.01058053970336914, 0.011219978332519531, 0.011859416961669922, 0.012498855590820312, 0.013138294219970703, 0.013777732849121094, 0.014417171478271484, 0.015056610107421875, 0.015696048736572266, 0.016335487365722656, 0.016974925994873047, 0.017614364624023438, 0.018253803253173828, 0.01889324188232422, 0.01953268051147461, 0.020172119140625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 12.0, 7.0, 13.0, 13.0, 21.0, 34.0, 45.0, 55.0, 106.0, 160.0, 353.0, 2078.0, 705780.0, 337431.0, 1580.0, 341.0, 177.0, 102.0, 48.0, 46.0, 31.0, 27.0, 30.0, 9.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.464111328125, -0.4495887756347656, -0.43506622314453125, -0.4205436706542969, -0.4060211181640625, -0.3914985656738281, -0.37697601318359375, -0.3624534606933594, -0.347930908203125, -0.3334083557128906, -0.31888580322265625, -0.3043632507324219, -0.2898406982421875, -0.2753181457519531, -0.26079559326171875, -0.24627304077148438, -0.23175048828125, -0.21722793579101562, -0.20270538330078125, -0.18818283081054688, -0.1736602783203125, -0.15913772583007812, -0.14461517333984375, -0.13009262084960938, -0.115570068359375, -0.10104751586914062, -0.08652496337890625, -0.07200241088867188, -0.0574798583984375, -0.042957305908203125, -0.02843475341796875, -0.013912200927734375, 0.0006103515625, 0.015132904052734375, 0.02965545654296875, 0.044178009033203125, 0.0587005615234375, 0.07322311401367188, 0.08774566650390625, 0.10226821899414062, 0.116790771484375, 0.13131332397460938, 0.14583587646484375, 0.16035842895507812, 0.1748809814453125, 0.18940353393554688, 0.20392608642578125, 0.21844863891601562, 0.23297119140625, 0.24749374389648438, 0.26201629638671875, 0.2765388488769531, 0.2910614013671875, 0.3055839538574219, 0.32010650634765625, 0.3346290588378906, 0.349151611328125, 0.3636741638183594, 0.37819671630859375, 0.3927192687988281, 0.4072418212890625, 0.4217643737792969, 0.43628692626953125, 0.4508094787597656, 0.46533203125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 39.0, 392.0, 526.0, 48.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00971305277198553, -0.006579868495464325, -0.0034466846846044064, -0.00031350087374448776, 0.002819683402776718, 0.005952867679297924, 0.009086051024496555, 0.012219236232340336, 0.015352419577538967, 0.018485603854060173, 0.021618787199258804, 0.024751972407102585, 0.027885155752301216, 0.031018339097499847, 0.03415152430534363, 0.03728470951318741, 0.04041789099574089, 0.04355107620358467, 0.04668425768613815, 0.049817442893981934, 0.052950628101825714, 0.056083813309669495, 0.05921699479222298, 0.06235018000006676, 0.06548336148262024, 0.06861654669046402, 0.0717497318983078, 0.07488290965557098, 0.07801609486341476, 0.08114928007125854, 0.08428246527910233, 0.0874156504869461, 0.09054883569478989, 0.09368202090263367, 0.09681520611047745, 0.09994839131832123, 0.10308156907558441, 0.10621475428342819, 0.10934793949127197, 0.11248112469911575, 0.11561430990695953, 0.11874749511480331, 0.1218806803226471, 0.12501385807991028, 0.12814705073833466, 0.13128022849559784, 0.13441342115402222, 0.1375465989112854, 0.14067977666854858, 0.14381295442581177, 0.14694614708423615, 0.15007932484149933, 0.1532125174999237, 0.1563456952571869, 0.15947887301445007, 0.16261206567287445, 0.16574525833129883, 0.168878436088562, 0.1720116287469864, 0.17514480650424957, 0.17827799916267395, 0.18141117691993713, 0.18454435467720032, 0.1876775473356247, 0.19081072509288788]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 3.0, 11.0, 13.0, 19.0, 26.0, 22.0, 25.0, 31.0, 37.0, 52.0, 56.0, 61.0, 57.0, 62.0, 41.0, 59.0, 55.0, 55.0, 59.0, 54.0, 36.0, 35.0, 29.0, 25.0, 19.0, 20.0, 14.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019249439239501953, -0.01865636743605137, -0.018063295632600784, -0.0174702238291502, -0.016877152025699615, -0.01628408022224903, -0.015691008418798447, -0.015097936615347862, -0.014504864811897278, -0.013911793008446693, -0.013318721204996109, -0.012725649401545525, -0.01213257759809494, -0.011539505794644356, -0.010946433991193771, -0.010353362187743187, -0.009760290384292603, -0.009167218580842018, -0.008574146777391434, -0.00798107497394085, -0.007388003170490265, -0.0067949313670396805, -0.006201859563589096, -0.005608787760138512, -0.005015715956687927, -0.004422644153237343, -0.0038295723497867584, -0.003236500546336174, -0.0026434287428855896, -0.002050356939435005, -0.0014572851359844208, -0.0008642133325338364, -0.00027114152908325195, 0.00032193027436733246, 0.0009150020778179169, 0.0015080738812685013, 0.0021011456847190857, 0.00269421748816967, 0.0032872892916202545, 0.003880361095070839, 0.004473432898521423, 0.005066504701972008, 0.005659576505422592, 0.006252648308873177, 0.006845720112323761, 0.007438791915774345, 0.00803186371922493, 0.008624935522675514, 0.009218007326126099, 0.009811079129576683, 0.010404150933027267, 0.010997222736477852, 0.011590294539928436, 0.01218336634337902, 0.012776438146829605, 0.01336950995028019, 0.013962581753730774, 0.014555653557181358, 0.015148725360631943, 0.015741797164082527, 0.01633486896753311, 0.016927940770983696, 0.01752101257443428, 0.018114084377884865, 0.01870715618133545]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 6.0, 4.0, 8.0, 12.0, 16.0, 8.0, 19.0, 16.0, 14.0, 23.0, 25.0, 21.0, 32.0, 28.0, 29.0, 39.0, 30.0, 31.0, 35.0, 46.0, 37.0, 32.0, 38.0, 31.0, 39.0, 42.0, 38.0, 31.0, 39.0, 25.0, 29.0, 24.0, 20.0, 16.0, 12.0, 19.0, 14.0, 13.0, 2.0, 8.0, 6.0, 8.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8515625, -7.592041015625, -7.33251953125, -7.072998046875, -6.8134765625, -6.553955078125, -6.29443359375, -6.034912109375, -5.775390625, -5.515869140625, -5.25634765625, -4.996826171875, -4.7373046875, -4.477783203125, -4.21826171875, -3.958740234375, -3.69921875, -3.439697265625, -3.18017578125, -2.920654296875, -2.6611328125, -2.401611328125, -2.14208984375, -1.882568359375, -1.623046875, -1.363525390625, -1.10400390625, -0.844482421875, -0.5849609375, -0.325439453125, -0.06591796875, 0.193603515625, 0.453125, 0.712646484375, 0.97216796875, 1.231689453125, 1.4912109375, 1.750732421875, 2.01025390625, 2.269775390625, 2.529296875, 2.788818359375, 3.04833984375, 3.307861328125, 3.5673828125, 3.826904296875, 4.08642578125, 4.345947265625, 4.60546875, 4.864990234375, 5.12451171875, 5.384033203125, 5.6435546875, 5.903076171875, 6.16259765625, 6.422119140625, 6.681640625, 6.941162109375, 7.20068359375, 7.460205078125, 7.7197265625, 7.979248046875, 8.23876953125, 8.498291015625, 8.7578125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 15.0, 13.0, 29.0, 38.0, 55.0, 83.0, 122.0, 162.0, 217.0, 406.0, 557.0, 845.0, 1220.0, 2056.0, 3181.0, 5138.0, 8558.0, 14320.0, 25783.0, 49401.0, 103767.0, 239588.0, 317889.0, 135930.0, 62868.0, 31952.0, 17452.0, 10228.0, 6082.0, 3759.0, 2468.0, 1463.0, 981.0, 626.0, 408.0, 262.0, 209.0, 124.0, 94.0, 67.0, 37.0, 30.0, 24.0, 17.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0], "bins": [-6.9765625, -6.7781982421875, -6.579833984375, -6.3814697265625, -6.18310546875, -5.9847412109375, -5.786376953125, -5.5880126953125, -5.3896484375, -5.1912841796875, -4.992919921875, -4.7945556640625, -4.59619140625, -4.3978271484375, -4.199462890625, -4.0010986328125, -3.802734375, -3.6043701171875, -3.406005859375, -3.2076416015625, -3.00927734375, -2.8109130859375, -2.612548828125, -2.4141845703125, -2.2158203125, -2.0174560546875, -1.819091796875, -1.6207275390625, -1.42236328125, -1.2239990234375, -1.025634765625, -0.8272705078125, -0.62890625, -0.4305419921875, -0.232177734375, -0.0338134765625, 0.16455078125, 0.3629150390625, 0.561279296875, 0.7596435546875, 0.9580078125, 1.1563720703125, 1.354736328125, 1.5531005859375, 1.75146484375, 1.9498291015625, 2.148193359375, 2.3465576171875, 2.544921875, 2.7432861328125, 2.941650390625, 3.1400146484375, 3.33837890625, 3.5367431640625, 3.735107421875, 3.9334716796875, 4.1318359375, 4.3302001953125, 4.528564453125, 4.7269287109375, 4.92529296875, 5.1236572265625, 5.322021484375, 5.5203857421875, 5.71875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 4.0, 15.0, 13.0, 12.0, 12.0, 23.0, 13.0, 20.0, 21.0, 27.0, 29.0, 45.0, 36.0, 56.0, 52.0, 69.0, 179.0, 1657.0, 244.0, 97.0, 63.0, 40.0, 46.0, 42.0, 45.0, 32.0, 20.0, 28.0, 28.0, 10.0, 8.0, 14.0, 12.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -34.287109375, -33.16796875, -32.048828125, -30.9296875, -29.810546875, -28.69140625, -27.572265625, -26.453125, -25.333984375, -24.21484375, -23.095703125, -21.9765625, -20.857421875, -19.73828125, -18.619140625, -17.5, -16.380859375, -15.26171875, -14.142578125, -13.0234375, -11.904296875, -10.78515625, -9.666015625, -8.546875, -7.427734375, -6.30859375, -5.189453125, -4.0703125, -2.951171875, -1.83203125, -0.712890625, 0.40625, 1.525390625, 2.64453125, 3.763671875, 4.8828125, 6.001953125, 7.12109375, 8.240234375, 9.359375, 10.478515625, 11.59765625, 12.716796875, 13.8359375, 14.955078125, 16.07421875, 17.193359375, 18.3125, 19.431640625, 20.55078125, 21.669921875, 22.7890625, 23.908203125, 25.02734375, 26.146484375, 27.265625, 28.384765625, 29.50390625, 30.623046875, 31.7421875, 32.861328125, 33.98046875, 35.099609375, 36.21875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 5.0, 7.0, 10.0, 12.0, 20.0, 24.0, 27.0, 62.0, 70.0, 101.0, 157.0, 208.0, 379.0, 903.0, 10545.0, 3097847.0, 32893.0, 1263.0, 405.0, 206.0, 155.0, 110.0, 81.0, 41.0, 49.0, 28.0, 22.0, 23.0, 20.0, 11.0, 9.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-118.6875, -115.61328125, -112.5390625, -109.46484375, -106.390625, -103.31640625, -100.2421875, -97.16796875, -94.09375, -91.01953125, -87.9453125, -84.87109375, -81.796875, -78.72265625, -75.6484375, -72.57421875, -69.5, -66.42578125, -63.3515625, -60.27734375, -57.203125, -54.12890625, -51.0546875, -47.98046875, -44.90625, -41.83203125, -38.7578125, -35.68359375, -32.609375, -29.53515625, -26.4609375, -23.38671875, -20.3125, -17.23828125, -14.1640625, -11.08984375, -8.015625, -4.94140625, -1.8671875, 1.20703125, 4.28125, 7.35546875, 10.4296875, 13.50390625, 16.578125, 19.65234375, 22.7265625, 25.80078125, 28.875, 31.94921875, 35.0234375, 38.09765625, 41.171875, 44.24609375, 47.3203125, 50.39453125, 53.46875, 56.54296875, 59.6171875, 62.69140625, 65.765625, 68.83984375, 71.9140625, 74.98828125, 78.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 21.0, 224.0, 627.0, 137.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.91394805908203, -17.59988784790039, -10.285826683044434, -2.9717655181884766, 4.342294692993164, 11.656356811523438, 18.970417022705078, 26.28447723388672, 33.59853744506836, 40.91259765625, 48.22665786743164, 55.54071807861328, 62.85478210449219, 70.16883850097656, 77.48290252685547, 84.79696655273438, 92.11102294921875, 99.42508697509766, 106.73914337158203, 114.05320739746094, 121.36726379394531, 128.68133544921875, 135.99539184570312, 143.3094482421875, 150.62350463867188, 157.93756103515625, 165.2516326904297, 172.56568908691406, 179.87974548339844, 187.19381713867188, 194.50787353515625, 201.82192993164062, 209.13600158691406, 216.45005798339844, 223.76412963867188, 231.07818603515625, 238.39224243164062, 245.706298828125, 253.02037048339844, 260.33441162109375, 267.64849853515625, 274.9625549316406, 282.276611328125, 289.5906677246094, 296.9047546386719, 304.21881103515625, 311.5328674316406, 318.846923828125, 326.1609802246094, 333.47503662109375, 340.7890930175781, 348.1031494140625, 355.417236328125, 362.7312927246094, 370.04534912109375, 377.3594055175781, 384.6734619140625, 391.9875183105469, 399.30157470703125, 406.6156311035156, 413.9297180175781, 421.2437744140625, 428.5578308105469, 435.87188720703125, 443.1859436035156]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 17.0, 23.0, 14.0, 20.0, 22.0, 17.0, 28.0, 36.0, 33.0, 40.0, 33.0, 39.0, 50.0, 49.0, 49.0, 43.0, 43.0, 42.0, 50.0, 38.0, 41.0, 32.0, 27.0, 21.0, 24.0, 20.0, 24.0, 23.0, 14.0, 13.0, 13.0, 8.0, 9.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.97756958007812, -86.88311004638672, -83.78865814208984, -80.69419860839844, -77.59973907470703, -74.50528717041016, -71.41082763671875, -68.31637573242188, -65.22191619873047, -62.12746047973633, -59.03300094604492, -55.93854522705078, -52.84408950805664, -49.7496337890625, -46.655174255371094, -43.56071853637695, -40.46625900268555, -37.371803283691406, -34.27734375, -31.18288803100586, -28.08843231201172, -24.993974685668945, -21.899517059326172, -18.80506134033203, -15.710603713989258, -12.6161470413208, -9.521690368652344, -6.42723274230957, -3.3327760696411133, -0.23831939697265625, 2.856138229370117, 5.950593948364258, 9.045051574707031, 12.139508247375488, 15.233964920043945, 18.32842254638672, 21.42287826538086, 24.517335891723633, 27.611793518066406, 30.706249237060547, 33.80070495605469, 36.89516067504883, 39.989620208740234, 43.084075927734375, 46.178531646728516, 49.272987365722656, 52.36744689941406, 55.4619026184082, 58.55636215209961, 61.65081787109375, 64.74527740478516, 67.83973693847656, 70.93418884277344, 74.02864837646484, 77.12310791015625, 80.21755981445312, 83.31201934814453, 86.40647888183594, 89.50093078613281, 92.59539031982422, 95.68984985351562, 98.7843017578125, 101.8787612915039, 104.97322082519531, 108.06767272949219]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 11.0, 10.0, 11.0, 15.0, 12.0, 16.0, 18.0, 19.0, 10.0, 40.0, 29.0, 25.0, 30.0, 31.0, 28.0, 26.0, 32.0, 31.0, 39.0, 43.0, 38.0, 31.0, 28.0, 45.0, 37.0, 36.0, 29.0, 35.0, 19.0, 38.0, 21.0, 19.0, 18.0, 14.0, 14.0, 13.0, 16.0, 8.0, 5.0, 3.0, 10.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.234375, -7.968505859375, -7.70263671875, -7.436767578125, -7.1708984375, -6.905029296875, -6.63916015625, -6.373291015625, -6.107421875, -5.841552734375, -5.57568359375, -5.309814453125, -5.0439453125, -4.778076171875, -4.51220703125, -4.246337890625, -3.98046875, -3.714599609375, -3.44873046875, -3.182861328125, -2.9169921875, -2.651123046875, -2.38525390625, -2.119384765625, -1.853515625, -1.587646484375, -1.32177734375, -1.055908203125, -0.7900390625, -0.524169921875, -0.25830078125, 0.007568359375, 0.2734375, 0.539306640625, 0.80517578125, 1.071044921875, 1.3369140625, 1.602783203125, 1.86865234375, 2.134521484375, 2.400390625, 2.666259765625, 2.93212890625, 3.197998046875, 3.4638671875, 3.729736328125, 3.99560546875, 4.261474609375, 4.52734375, 4.793212890625, 5.05908203125, 5.324951171875, 5.5908203125, 5.856689453125, 6.12255859375, 6.388427734375, 6.654296875, 6.920166015625, 7.18603515625, 7.451904296875, 7.7177734375, 7.983642578125, 8.24951171875, 8.515380859375, 8.78125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 5.0, 10.0, 7.0, 14.0, 10.0, 12.0, 18.0, 17.0, 29.0, 18.0, 33.0, 40.0, 50.0, 114.0, 275.0, 815.0, 2726.0, 12968.0, 117933.0, 1744033.0, 2134721.0, 159468.0, 16060.0, 3242.0, 945.0, 308.0, 118.0, 49.0, 33.0, 32.0, 21.0, 26.0, 22.0, 18.0, 11.0, 11.0, 9.0, 5.0, 14.0, 6.0, 3.0, 9.0, 3.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.015625, -26.145751953125, -25.27587890625, -24.406005859375, -23.5361328125, -22.666259765625, -21.79638671875, -20.926513671875, -20.056640625, -19.186767578125, -18.31689453125, -17.447021484375, -16.5771484375, -15.707275390625, -14.83740234375, -13.967529296875, -13.09765625, -12.227783203125, -11.35791015625, -10.488037109375, -9.6181640625, -8.748291015625, -7.87841796875, -7.008544921875, -6.138671875, -5.268798828125, -4.39892578125, -3.529052734375, -2.6591796875, -1.789306640625, -0.91943359375, -0.049560546875, 0.8203125, 1.690185546875, 2.56005859375, 3.429931640625, 4.2998046875, 5.169677734375, 6.03955078125, 6.909423828125, 7.779296875, 8.649169921875, 9.51904296875, 10.388916015625, 11.2587890625, 12.128662109375, 12.99853515625, 13.868408203125, 14.73828125, 15.608154296875, 16.47802734375, 17.347900390625, 18.2177734375, 19.087646484375, 19.95751953125, 20.827392578125, 21.697265625, 22.567138671875, 23.43701171875, 24.306884765625, 25.1767578125, 26.046630859375, 26.91650390625, 27.786376953125, 28.65625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 18.0, 22.0, 25.0, 33.0, 57.0, 83.0, 122.0, 139.0, 186.0, 246.0, 322.0, 431.0, 429.0, 398.0, 416.0, 306.0, 192.0, 161.0, 119.0, 102.0, 66.0, 44.0, 32.0, 32.0, 20.0, 16.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.625, -21.00146484375, -20.3779296875, -19.75439453125, -19.130859375, -18.50732421875, -17.8837890625, -17.26025390625, -16.63671875, -16.01318359375, -15.3896484375, -14.76611328125, -14.142578125, -13.51904296875, -12.8955078125, -12.27197265625, -11.6484375, -11.02490234375, -10.4013671875, -9.77783203125, -9.154296875, -8.53076171875, -7.9072265625, -7.28369140625, -6.66015625, -6.03662109375, -5.4130859375, -4.78955078125, -4.166015625, -3.54248046875, -2.9189453125, -2.29541015625, -1.671875, -1.04833984375, -0.4248046875, 0.19873046875, 0.822265625, 1.44580078125, 2.0693359375, 2.69287109375, 3.31640625, 3.93994140625, 4.5634765625, 5.18701171875, 5.810546875, 6.43408203125, 7.0576171875, 7.68115234375, 8.3046875, 8.92822265625, 9.5517578125, 10.17529296875, 10.798828125, 11.42236328125, 12.0458984375, 12.66943359375, 13.29296875, 13.91650390625, 14.5400390625, 15.16357421875, 15.787109375, 16.41064453125, 17.0341796875, 17.65771484375, 18.28125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 11.0, 14.0, 23.0, 27.0, 32.0, 52.0, 66.0, 102.0, 125.0, 148.0, 201.0, 342.0, 721.0, 3528.0, 66226.0, 3195418.0, 905865.0, 18228.0, 1648.0, 473.0, 274.0, 196.0, 154.0, 123.0, 87.0, 52.0, 40.0, 32.0, 17.0, 12.0, 11.0, 4.0, 10.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.65625, -51.72705078125, -49.7978515625, -47.86865234375, -45.939453125, -44.01025390625, -42.0810546875, -40.15185546875, -38.22265625, -36.29345703125, -34.3642578125, -32.43505859375, -30.505859375, -28.57666015625, -26.6474609375, -24.71826171875, -22.7890625, -20.85986328125, -18.9306640625, -17.00146484375, -15.072265625, -13.14306640625, -11.2138671875, -9.28466796875, -7.35546875, -5.42626953125, -3.4970703125, -1.56787109375, 0.361328125, 2.29052734375, 4.2197265625, 6.14892578125, 8.078125, 10.00732421875, 11.9365234375, 13.86572265625, 15.794921875, 17.72412109375, 19.6533203125, 21.58251953125, 23.51171875, 25.44091796875, 27.3701171875, 29.29931640625, 31.228515625, 33.15771484375, 35.0869140625, 37.01611328125, 38.9453125, 40.87451171875, 42.8037109375, 44.73291015625, 46.662109375, 48.59130859375, 50.5205078125, 52.44970703125, 54.37890625, 56.30810546875, 58.2373046875, 60.16650390625, 62.095703125, 64.02490234375, 65.9541015625, 67.88330078125, 69.8125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 17.0, 40.0, 113.0, 166.0, 208.0, 195.0, 136.0, 88.0, 24.0, 14.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-262.7371826171875, -257.108154296875, -251.4791259765625, -245.85009765625, -240.2210693359375, -234.59202575683594, -228.96299743652344, -223.33396911621094, -217.70494079589844, -212.07591247558594, -206.44688415527344, -200.81785583496094, -195.18881225585938, -189.55978393554688, -183.93075561523438, -178.30172729492188, -172.67269897460938, -167.04367065429688, -161.41464233398438, -155.78561401367188, -150.15658569335938, -144.5275421142578, -138.8985137939453, -133.2694854736328, -127.64045715332031, -122.01142883300781, -116.38240051269531, -110.75336456298828, -105.12433624267578, -99.49530792236328, -93.86627197265625, -88.23724365234375, -82.60820770263672, -76.97917938232422, -71.35014343261719, -65.72111511230469, -60.09208679199219, -54.46305847167969, -48.83402633666992, -43.204994201660156, -37.575965881347656, -31.946935653686523, -26.31790542602539, -20.688875198364258, -15.059844970703125, -9.430814743041992, -3.8017845153808594, 1.8272476196289062, 7.456275939941406, 13.085306167602539, 18.714336395263672, 24.343366622924805, 29.972396850585938, 35.60142517089844, 41.2304573059082, 46.85948944091797, 52.48851776123047, 58.11754608154297, 63.746578216552734, 69.3756103515625, 75.004638671875, 80.6336669921875, 86.2626953125, 91.89173126220703, 97.52075958251953]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 5.0, 6.0, 8.0, 5.0, 16.0, 20.0, 17.0, 18.0, 23.0, 27.0, 35.0, 25.0, 30.0, 33.0, 40.0, 54.0, 49.0, 44.0, 50.0, 41.0, 38.0, 40.0, 35.0, 30.0, 46.0, 40.0, 30.0, 27.0, 27.0, 20.0, 23.0, 22.0, 14.0, 7.0, 14.0, 5.0, 6.0, 10.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.99034118652344, -62.831356048583984, -60.672367095947266, -58.51338195800781, -56.354393005371094, -54.19540786743164, -52.03642272949219, -49.87743377685547, -47.71844482421875, -45.5594596862793, -43.40047073364258, -41.241485595703125, -39.082496643066406, -36.92351150512695, -34.7645263671875, -32.60553741455078, -30.446552276611328, -28.287565231323242, -26.128578186035156, -23.969593048095703, -21.810604095458984, -19.65161895751953, -17.492631912231445, -15.33364486694336, -13.174657821655273, -11.015670776367188, -8.856683731079102, -6.697697639465332, -4.538710594177246, -2.37972354888916, -0.22073745727539062, 1.9382495880126953, 4.097236633300781, 6.256223678588867, 8.415210723876953, 10.574196815490723, 12.733183860778809, 14.892170906066895, 17.051156997680664, 19.21014404296875, 21.369131088256836, 23.528118133544922, 25.687105178833008, 27.846092224121094, 30.005077362060547, 32.164066314697266, 34.32305145263672, 36.48204040527344, 38.64102554321289, 40.800010681152344, 42.95899963378906, 45.117984771728516, 47.276973724365234, 49.43595886230469, 51.594947814941406, 53.75393295288086, 55.91291809082031, 58.071903228759766, 60.230892181396484, 62.38987731933594, 64.54886627197266, 66.70785522460938, 68.86683654785156, 71.02582550048828, 73.184814453125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 9.0, 10.0, 10.0, 18.0, 19.0, 13.0, 20.0, 19.0, 21.0, 24.0, 27.0, 30.0, 42.0, 30.0, 35.0, 31.0, 35.0, 28.0, 46.0, 37.0, 33.0, 38.0, 32.0, 34.0, 25.0, 42.0, 26.0, 41.0, 27.0, 23.0, 24.0, 17.0, 18.0, 18.0, 16.0, 8.0, 15.0, 4.0, 2.0, 10.0, 3.0, 5.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.1015625, -7.8349609375, -7.568359375, -7.3017578125, -7.03515625, -6.7685546875, -6.501953125, -6.2353515625, -5.96875, -5.7021484375, -5.435546875, -5.1689453125, -4.90234375, -4.6357421875, -4.369140625, -4.1025390625, -3.8359375, -3.5693359375, -3.302734375, -3.0361328125, -2.76953125, -2.5029296875, -2.236328125, -1.9697265625, -1.703125, -1.4365234375, -1.169921875, -0.9033203125, -0.63671875, -0.3701171875, -0.103515625, 0.1630859375, 0.4296875, 0.6962890625, 0.962890625, 1.2294921875, 1.49609375, 1.7626953125, 2.029296875, 2.2958984375, 2.5625, 2.8291015625, 3.095703125, 3.3623046875, 3.62890625, 3.8955078125, 4.162109375, 4.4287109375, 4.6953125, 4.9619140625, 5.228515625, 5.4951171875, 5.76171875, 6.0283203125, 6.294921875, 6.5615234375, 6.828125, 7.0947265625, 7.361328125, 7.6279296875, 7.89453125, 8.1611328125, 8.427734375, 8.6943359375, 8.9609375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 6.0, 11.0, 33.0, 41.0, 57.0, 57.0, 106.0, 156.0, 254.0, 407.0, 630.0, 1076.0, 1651.0, 2737.0, 4418.0, 7490.0, 12448.0, 20325.0, 34498.0, 59206.0, 101788.0, 165370.0, 212646.0, 169393.0, 104408.0, 60702.0, 35552.0, 20985.0, 12668.0, 7487.0, 4485.0, 2776.0, 1736.0, 1107.0, 661.0, 402.0, 255.0, 179.0, 129.0, 71.0, 55.0, 28.0, 18.0, 10.0, 11.0, 11.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9384918212890625, -0.907745361328125, -0.8769989013671875, -0.84625244140625, -0.8155059814453125, -0.784759521484375, -0.7540130615234375, -0.7232666015625, -0.6925201416015625, -0.661773681640625, -0.6310272216796875, -0.60028076171875, -0.5695343017578125, -0.538787841796875, -0.5080413818359375, -0.477294921875, -0.4465484619140625, -0.415802001953125, -0.3850555419921875, -0.35430908203125, -0.3235626220703125, -0.292816162109375, -0.2620697021484375, -0.2313232421875, -0.2005767822265625, -0.169830322265625, -0.1390838623046875, -0.10833740234375, -0.0775909423828125, -0.046844482421875, -0.0160980224609375, 0.0146484375, 0.0453948974609375, 0.076141357421875, 0.1068878173828125, 0.13763427734375, 0.1683807373046875, 0.199127197265625, 0.2298736572265625, 0.2606201171875, 0.2913665771484375, 0.322113037109375, 0.3528594970703125, 0.38360595703125, 0.4143524169921875, 0.445098876953125, 0.4758453369140625, 0.506591796875, 0.5373382568359375, 0.568084716796875, 0.5988311767578125, 0.62957763671875, 0.6603240966796875, 0.691070556640625, 0.7218170166015625, 0.7525634765625, 0.7833099365234375, 0.814056396484375, 0.8448028564453125, 0.87554931640625, 0.9062957763671875, 0.937042236328125, 0.9677886962890625, 0.99853515625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 5.0, 12.0, 13.0, 14.0, 14.0, 20.0, 26.0, 28.0, 33.0, 34.0, 37.0, 46.0, 53.0, 45.0, 38.0, 54.0, 1077.0, 36.0, 48.0, 46.0, 51.0, 37.0, 36.0, 44.0, 41.0, 21.0, 16.0, 18.0, 19.0, 11.0, 18.0, 2.0, 1.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.4765625, -8.24749755859375, -8.0184326171875, -7.78936767578125, -7.560302734375, -7.33123779296875, -7.1021728515625, -6.87310791015625, -6.64404296875, -6.41497802734375, -6.1859130859375, -5.95684814453125, -5.727783203125, -5.49871826171875, -5.2696533203125, -5.04058837890625, -4.8115234375, -4.58245849609375, -4.3533935546875, -4.12432861328125, -3.895263671875, -3.66619873046875, -3.4371337890625, -3.20806884765625, -2.97900390625, -2.74993896484375, -2.5208740234375, -2.29180908203125, -2.062744140625, -1.83367919921875, -1.6046142578125, -1.37554931640625, -1.146484375, -0.91741943359375, -0.6883544921875, -0.45928955078125, -0.230224609375, -0.00115966796875, 0.2279052734375, 0.45697021484375, 0.68603515625, 0.91510009765625, 1.1441650390625, 1.37322998046875, 1.602294921875, 1.83135986328125, 2.0604248046875, 2.28948974609375, 2.5185546875, 2.74761962890625, 2.9766845703125, 3.20574951171875, 3.434814453125, 3.66387939453125, 3.8929443359375, 4.12200927734375, 4.35107421875, 4.58013916015625, 4.8092041015625, 5.03826904296875, 5.267333984375, 5.49639892578125, 5.7254638671875, 5.95452880859375, 6.18359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 1.0, 5.0, 7.0, 4.0, 8.0, 8.0, 17.0, 27.0, 37.0, 53.0, 89.0, 121.0, 191.0, 254.0, 369.0, 551.0, 863.0, 1302.0, 2022.0, 3080.0, 5006.0, 7722.0, 12212.0, 19147.0, 30556.0, 47118.0, 72884.0, 108763.0, 166501.0, 1181748.0, 147341.0, 101549.0, 67632.0, 43817.0, 27852.0, 17490.0, 11001.0, 7060.0, 4383.0, 2839.0, 1885.0, 1215.0, 738.0, 532.0, 335.0, 254.0, 164.0, 110.0, 86.0, 63.0, 34.0, 29.0, 27.0, 13.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.54638671875, -0.5295257568359375, -0.512664794921875, -0.4958038330078125, -0.47894287109375, -0.4620819091796875, -0.445220947265625, -0.4283599853515625, -0.4114990234375, -0.3946380615234375, -0.377777099609375, -0.3609161376953125, -0.34405517578125, -0.3271942138671875, -0.310333251953125, -0.2934722900390625, -0.276611328125, -0.2597503662109375, -0.242889404296875, -0.2260284423828125, -0.20916748046875, -0.1923065185546875, -0.175445556640625, -0.1585845947265625, -0.1417236328125, -0.1248626708984375, -0.108001708984375, -0.0911407470703125, -0.07427978515625, -0.0574188232421875, -0.040557861328125, -0.0236968994140625, -0.0068359375, 0.0100250244140625, 0.026885986328125, 0.0437469482421875, 0.06060791015625, 0.0774688720703125, 0.094329833984375, 0.1111907958984375, 0.1280517578125, 0.1449127197265625, 0.161773681640625, 0.1786346435546875, 0.19549560546875, 0.2123565673828125, 0.229217529296875, 0.2460784912109375, 0.262939453125, 0.2798004150390625, 0.296661376953125, 0.3135223388671875, 0.33038330078125, 0.3472442626953125, 0.364105224609375, 0.3809661865234375, 0.3978271484375, 0.4146881103515625, 0.431549072265625, 0.4484100341796875, 0.46527099609375, 0.4821319580078125, 0.498992919921875, 0.5158538818359375, 0.53271484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 6.0, 4.0, 10.0, 13.0, 7.0, 11.0, 19.0, 11.0, 24.0, 32.0, 34.0, 33.0, 42.0, 60.0, 78.0, 85.0, 94.0, 65.0, 53.0, 55.0, 44.0, 39.0, 31.0, 30.0, 24.0, 14.0, 14.0, 20.0, 10.0, 6.0, 6.0, 9.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.020076513290405273, -0.019431591033935547, -0.01878666877746582, -0.018141746520996094, -0.017496824264526367, -0.01685190200805664, -0.016206979751586914, -0.015562057495117188, -0.014917135238647461, -0.014272212982177734, -0.013627290725708008, -0.012982368469238281, -0.012337446212768555, -0.011692523956298828, -0.011047601699829102, -0.010402679443359375, -0.009757757186889648, -0.009112834930419922, -0.008467912673950195, -0.007822990417480469, -0.007178068161010742, -0.006533145904541016, -0.005888223648071289, -0.0052433013916015625, -0.004598379135131836, -0.003953456878662109, -0.003308534622192383, -0.0026636123657226562, -0.0020186901092529297, -0.0013737678527832031, -0.0007288455963134766, -8.392333984375e-05, 0.0005609989166259766, 0.0012059211730957031, 0.0018508434295654297, 0.0024957656860351562, 0.003140687942504883, 0.0037856101989746094, 0.004430532455444336, 0.0050754547119140625, 0.005720376968383789, 0.006365299224853516, 0.007010221481323242, 0.007655143737792969, 0.008300065994262695, 0.008944988250732422, 0.009589910507202148, 0.010234832763671875, 0.010879755020141602, 0.011524677276611328, 0.012169599533081055, 0.012814521789550781, 0.013459444046020508, 0.014104366302490234, 0.014749288558959961, 0.015394210815429688, 0.016039133071899414, 0.01668405532836914, 0.017328977584838867, 0.017973899841308594, 0.01861882209777832, 0.019263744354248047, 0.019908666610717773, 0.0205535888671875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 6.0, 5.0, 5.0, 7.0, 11.0, 15.0, 15.0, 18.0, 18.0, 34.0, 46.0, 57.0, 73.0, 134.0, 199.0, 565.0, 7809.0, 760551.0, 273648.0, 4339.0, 443.0, 172.0, 113.0, 61.0, 57.0, 30.0, 25.0, 12.0, 20.0, 12.0, 13.0, 6.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.402099609375, -0.3894996643066406, -0.37689971923828125, -0.3642997741699219, -0.3516998291015625, -0.3390998840332031, -0.32649993896484375, -0.3138999938964844, -0.301300048828125, -0.2887001037597656, -0.27610015869140625, -0.2635002136230469, -0.2509002685546875, -0.23830032348632812, -0.22570037841796875, -0.21310043334960938, -0.20050048828125, -0.18790054321289062, -0.17530059814453125, -0.16270065307617188, -0.1501007080078125, -0.13750076293945312, -0.12490081787109375, -0.11230087280273438, -0.099700927734375, -0.08710098266601562, -0.07450103759765625, -0.061901092529296875, -0.0493011474609375, -0.036701202392578125, -0.02410125732421875, -0.011501312255859375, 0.0010986328125, 0.013698577880859375, 0.02629852294921875, 0.038898468017578125, 0.0514984130859375, 0.06409835815429688, 0.07669830322265625, 0.08929824829101562, 0.101898193359375, 0.11449813842773438, 0.12709808349609375, 0.13969802856445312, 0.1522979736328125, 0.16489791870117188, 0.17749786376953125, 0.19009780883789062, 0.20269775390625, 0.21529769897460938, 0.22789764404296875, 0.24049758911132812, 0.2530975341796875, 0.2656974792480469, 0.27829742431640625, 0.2908973693847656, 0.303497314453125, 0.3160972595214844, 0.32869720458984375, 0.3412971496582031, 0.3538970947265625, 0.3664970397949219, 0.37909698486328125, 0.3916969299316406, 0.404296875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 13.0, 421.0, 553.0, 28.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04627005383372307, -0.03971001133322716, -0.03314996883273125, -0.026589928194880486, -0.020029885694384575, -0.013469845056533813, -0.006909802556037903, -0.0003497600555419922, 0.0062102824449539185, 0.012770324945449829, 0.01933036744594574, 0.0258904080837965, 0.03245045244693756, 0.03901049122214317, 0.045570533722639084, 0.052130576223134995, 0.058690618723630905, 0.06525065749883652, 0.07181069999933243, 0.07837074249982834, 0.08493078500032425, 0.09149082750082016, 0.09805087000131607, 0.10461091250181198, 0.11117095500230789, 0.1177309975028038, 0.12429104000329971, 0.13085107505321503, 0.13741111755371094, 0.14397116005420685, 0.15053120255470276, 0.15709124505519867, 0.16365130245685577, 0.17021134495735168, 0.1767713874578476, 0.1833314299583435, 0.18989147245883942, 0.19645151495933533, 0.20301155745983124, 0.20957159996032715, 0.21613164246082306, 0.22269168496131897, 0.22925172746181488, 0.2358117699623108, 0.2423718124628067, 0.2489318549633026, 0.25549188256263733, 0.26205193996429443, 0.26861196756362915, 0.27517199516296387, 0.28173205256462097, 0.2882920801639557, 0.2948521375656128, 0.3014121651649475, 0.3079722225666046, 0.31453225016593933, 0.32109230756759644, 0.32765233516693115, 0.33421239256858826, 0.340772420167923, 0.3473324775695801, 0.3538925051689148, 0.3604525625705719, 0.3670125901699066, 0.3735726475715637]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 12.0, 19.0, 23.0, 21.0, 39.0, 48.0, 58.0, 67.0, 70.0, 74.0, 74.0, 66.0, 81.0, 64.0, 62.0, 61.0, 47.0, 29.0, 22.0, 21.0, 15.0, 15.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022348761558532715, -0.0216132253408432, -0.020877689123153687, -0.020142152905464172, -0.019406616687774658, -0.018671080470085144, -0.01793554425239563, -0.017200008034706116, -0.0164644718170166, -0.015728935599327087, -0.014993399381637573, -0.014257863163948059, -0.013522326946258545, -0.01278679072856903, -0.012051254510879517, -0.011315718293190002, -0.010580182075500488, -0.009844645857810974, -0.00910910964012146, -0.008373573422431946, -0.007638037204742432, -0.0069025009870529175, -0.006166964769363403, -0.005431428551673889, -0.004695892333984375, -0.003960356116294861, -0.0032248198986053467, -0.0024892836809158325, -0.0017537474632263184, -0.0010182112455368042, -0.00028267502784729004, 0.0004528611898422241, 0.0011883974075317383, 0.0019239336252212524, 0.0026594698429107666, 0.0033950060606002808, 0.004130542278289795, 0.004866078495979309, 0.005601614713668823, 0.006337150931358337, 0.0070726871490478516, 0.007808223366737366, 0.00854375958442688, 0.009279295802116394, 0.010014832019805908, 0.010750368237495422, 0.011485904455184937, 0.01222144067287445, 0.012956976890563965, 0.013692513108253479, 0.014428049325942993, 0.015163585543632507, 0.01589912176132202, 0.016634657979011536, 0.01737019419670105, 0.018105730414390564, 0.018841266632080078, 0.019576802849769592, 0.020312339067459106, 0.02104787528514862, 0.021783411502838135, 0.02251894772052765, 0.023254483938217163, 0.023990020155906677, 0.02472555637359619]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 9.0, 10.0, 10.0, 18.0, 19.0, 13.0, 20.0, 19.0, 21.0, 24.0, 27.0, 30.0, 42.0, 30.0, 35.0, 31.0, 35.0, 28.0, 46.0, 37.0, 33.0, 38.0, 32.0, 34.0, 25.0, 42.0, 26.0, 40.0, 28.0, 23.0, 24.0, 17.0, 18.0, 18.0, 16.0, 8.0, 15.0, 4.0, 2.0, 10.0, 3.0, 5.0, 3.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.1015625, -7.8349609375, -7.568359375, -7.3017578125, -7.03515625, -6.7685546875, -6.501953125, -6.2353515625, -5.96875, -5.7021484375, -5.435546875, -5.1689453125, -4.90234375, -4.6357421875, -4.369140625, -4.1025390625, -3.8359375, -3.5693359375, -3.302734375, -3.0361328125, -2.76953125, -2.5029296875, -2.236328125, -1.9697265625, -1.703125, -1.4365234375, -1.169921875, -0.9033203125, -0.63671875, -0.3701171875, -0.103515625, 0.1630859375, 0.4296875, 0.6962890625, 0.962890625, 1.2294921875, 1.49609375, 1.7626953125, 2.029296875, 2.2958984375, 2.5625, 2.8291015625, 3.095703125, 3.3623046875, 3.62890625, 3.8955078125, 4.162109375, 4.4287109375, 4.6953125, 4.9619140625, 5.228515625, 5.4951171875, 5.76171875, 6.0283203125, 6.294921875, 6.5615234375, 6.828125, 7.0947265625, 7.361328125, 7.6279296875, 7.89453125, 8.1611328125, 8.427734375, 8.6943359375, 8.9609375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 10.0, 17.0, 31.0, 40.0, 57.0, 76.0, 128.0, 182.0, 298.0, 479.0, 698.0, 1030.0, 1630.0, 2514.0, 3828.0, 5982.0, 9958.0, 18158.0, 37693.0, 103855.0, 346164.0, 333539.0, 101235.0, 36626.0, 17593.0, 9841.0, 5990.0, 3798.0, 2475.0, 1572.0, 1027.0, 664.0, 494.0, 279.0, 200.0, 128.0, 81.0, 65.0, 38.0, 21.0, 20.0, 13.0, 14.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.83074951171875, -6.5950927734375, -6.35943603515625, -6.123779296875, -5.88812255859375, -5.6524658203125, -5.41680908203125, -5.18115234375, -4.94549560546875, -4.7098388671875, -4.47418212890625, -4.238525390625, -4.00286865234375, -3.7672119140625, -3.53155517578125, -3.2958984375, -3.06024169921875, -2.8245849609375, -2.58892822265625, -2.353271484375, -2.11761474609375, -1.8819580078125, -1.64630126953125, -1.41064453125, -1.17498779296875, -0.9393310546875, -0.70367431640625, -0.468017578125, -0.23236083984375, 0.0032958984375, 0.23895263671875, 0.474609375, 0.71026611328125, 0.9459228515625, 1.18157958984375, 1.417236328125, 1.65289306640625, 1.8885498046875, 2.12420654296875, 2.35986328125, 2.59552001953125, 2.8311767578125, 3.06683349609375, 3.302490234375, 3.53814697265625, 3.7738037109375, 4.00946044921875, 4.2451171875, 4.48077392578125, 4.7164306640625, 4.95208740234375, 5.187744140625, 5.42340087890625, 5.6590576171875, 5.89471435546875, 6.13037109375, 6.36602783203125, 6.6016845703125, 6.83734130859375, 7.072998046875, 7.30865478515625, 7.5443115234375, 7.77996826171875, 8.015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 12.0, 6.0, 6.0, 17.0, 18.0, 17.0, 24.0, 25.0, 42.0, 37.0, 34.0, 39.0, 65.0, 67.0, 90.0, 143.0, 1631.0, 272.0, 81.0, 60.0, 46.0, 53.0, 32.0, 30.0, 30.0, 27.0, 28.0, 26.0, 19.0, 13.0, 12.0, 9.0, 7.0, 7.0, 4.0, 6.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.40625, -42.28369140625, -41.1611328125, -40.03857421875, -38.916015625, -37.79345703125, -36.6708984375, -35.54833984375, -34.42578125, -33.30322265625, -32.1806640625, -31.05810546875, -29.935546875, -28.81298828125, -27.6904296875, -26.56787109375, -25.4453125, -24.32275390625, -23.2001953125, -22.07763671875, -20.955078125, -19.83251953125, -18.7099609375, -17.58740234375, -16.46484375, -15.34228515625, -14.2197265625, -13.09716796875, -11.974609375, -10.85205078125, -9.7294921875, -8.60693359375, -7.484375, -6.36181640625, -5.2392578125, -4.11669921875, -2.994140625, -1.87158203125, -0.7490234375, 0.37353515625, 1.49609375, 2.61865234375, 3.7412109375, 4.86376953125, 5.986328125, 7.10888671875, 8.2314453125, 9.35400390625, 10.4765625, 11.59912109375, 12.7216796875, 13.84423828125, 14.966796875, 16.08935546875, 17.2119140625, 18.33447265625, 19.45703125, 20.57958984375, 21.7021484375, 22.82470703125, 23.947265625, 25.06982421875, 26.1923828125, 27.31494140625, 28.4375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 16.0, 23.0, 28.0, 53.0, 63.0, 112.0, 166.0, 232.0, 418.0, 1020.0, 76257.0, 3062770.0, 3077.0, 524.0, 286.0, 193.0, 141.0, 64.0, 79.0, 30.0, 42.0, 23.0, 15.0, 8.0, 8.0, 6.0, 2.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.4375, -112.5830078125, -108.728515625, -104.8740234375, -101.01953125, -97.1650390625, -93.310546875, -89.4560546875, -85.6015625, -81.7470703125, -77.892578125, -74.0380859375, -70.18359375, -66.3291015625, -62.474609375, -58.6201171875, -54.765625, -50.9111328125, -47.056640625, -43.2021484375, -39.34765625, -35.4931640625, -31.638671875, -27.7841796875, -23.9296875, -20.0751953125, -16.220703125, -12.3662109375, -8.51171875, -4.6572265625, -0.802734375, 3.0517578125, 6.90625, 10.7607421875, 14.615234375, 18.4697265625, 22.32421875, 26.1787109375, 30.033203125, 33.8876953125, 37.7421875, 41.5966796875, 45.451171875, 49.3056640625, 53.16015625, 57.0146484375, 60.869140625, 64.7236328125, 68.578125, 72.4326171875, 76.287109375, 80.1416015625, 83.99609375, 87.8505859375, 91.705078125, 95.5595703125, 99.4140625, 103.2685546875, 107.123046875, 110.9775390625, 114.83203125, 118.6865234375, 122.541015625, 126.3955078125, 130.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [9.0, 969.0, 42.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.82015037536621, -10.790372848510742, 7.239404678344727, 25.269182205200195, 43.29895782470703, 61.3287353515625, 79.35851287841797, 97.38829040527344, 115.4180679321289, 133.44784545898438, 151.47763061523438, 169.5074005126953, 187.53717041015625, 205.56695556640625, 223.59674072265625, 241.6265106201172, 259.6562805175781, 277.6860656738281, 295.7158203125, 313.74560546875, 331.775390625, 349.80517578125, 367.8349609375, 385.8647155761719, 403.8945007324219, 421.9242858886719, 439.95404052734375, 457.98382568359375, 476.01361083984375, 494.04339599609375, 512.0731811523438, 530.1029663085938, 548.1326904296875, 566.1624755859375, 584.1922607421875, 602.2220458984375, 620.2518310546875, 638.2815551757812, 656.3113403320312, 674.3411254882812, 692.3709106445312, 710.4006958007812, 728.4304809570312, 746.4602661132812, 764.489990234375, 782.519775390625, 800.549560546875, 818.579345703125, 836.609130859375, 854.638916015625, 872.668701171875, 890.698486328125, 908.728271484375, 926.7579956054688, 944.7877807617188, 962.8175659179688, 980.8473510742188, 998.8771362304688, 1016.9069213867188, 1034.9366455078125, 1052.9664306640625, 1070.9962158203125, 1089.0260009765625, 1107.0557861328125, 1125.0855712890625]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 11.0, 6.0, 8.0, 10.0, 7.0, 22.0, 19.0, 24.0, 16.0, 16.0, 25.0, 29.0, 33.0, 35.0, 31.0, 31.0, 42.0, 45.0, 43.0, 34.0, 39.0, 43.0, 56.0, 38.0, 38.0, 36.0, 28.0, 21.0, 31.0, 32.0, 22.0, 16.0, 15.0, 12.0, 13.0, 13.0, 8.0, 8.0, 3.0, 8.0, 7.0, 5.0, 5.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-89.05794525146484, -86.40727996826172, -83.75660705566406, -81.10594177246094, -78.45527648925781, -75.80461120605469, -73.15394592285156, -70.5032730102539, -67.85260772705078, -65.20194244384766, -62.551273345947266, -59.900604248046875, -57.24993896484375, -54.599273681640625, -51.948604583740234, -49.297935485839844, -46.64727020263672, -43.996604919433594, -41.3459358215332, -38.69526672363281, -36.04460144042969, -33.39393615722656, -30.743267059326172, -28.092599868774414, -25.441932678222656, -22.7912654876709, -20.14059829711914, -17.489931106567383, -14.839263916015625, -12.188596725463867, -9.53792953491211, -6.887262344360352, -4.2365875244140625, -1.5859203338623047, 1.0647468566894531, 3.715414047241211, 6.366081237792969, 9.016748428344727, 11.667415618896484, 14.318082809448242, 16.96875, 19.619417190551758, 22.270084381103516, 24.920751571655273, 27.57141876220703, 30.22208595275879, 32.87275314331055, 35.52342224121094, 38.17408752441406, 40.82475280761719, 43.47542190551758, 46.12609100341797, 48.776756286621094, 51.42742156982422, 54.07809066772461, 56.728759765625, 59.379425048828125, 62.03009033203125, 64.68075561523438, 67.33142852783203, 69.98209381103516, 72.63275909423828, 75.28343200683594, 77.93409729003906, 80.58476257324219]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 5.0, 12.0, 7.0, 9.0, 7.0, 21.0, 13.0, 18.0, 31.0, 28.0, 31.0, 28.0, 31.0, 35.0, 29.0, 37.0, 28.0, 34.0, 44.0, 40.0, 34.0, 32.0, 37.0, 37.0, 25.0, 37.0, 44.0, 29.0, 27.0, 24.0, 26.0, 24.0, 16.0, 12.0, 19.0, 17.0, 13.0, 9.0, 7.0, 6.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6796875, -8.3896484375, -8.099609375, -7.8095703125, -7.51953125, -7.2294921875, -6.939453125, -6.6494140625, -6.359375, -6.0693359375, -5.779296875, -5.4892578125, -5.19921875, -4.9091796875, -4.619140625, -4.3291015625, -4.0390625, -3.7490234375, -3.458984375, -3.1689453125, -2.87890625, -2.5888671875, -2.298828125, -2.0087890625, -1.71875, -1.4287109375, -1.138671875, -0.8486328125, -0.55859375, -0.2685546875, 0.021484375, 0.3115234375, 0.6015625, 0.8916015625, 1.181640625, 1.4716796875, 1.76171875, 2.0517578125, 2.341796875, 2.6318359375, 2.921875, 3.2119140625, 3.501953125, 3.7919921875, 4.08203125, 4.3720703125, 4.662109375, 4.9521484375, 5.2421875, 5.5322265625, 5.822265625, 6.1123046875, 6.40234375, 6.6923828125, 6.982421875, 7.2724609375, 7.5625, 7.8525390625, 8.142578125, 8.4326171875, 8.72265625, 9.0126953125, 9.302734375, 9.5927734375, 9.8828125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 4.0, 4.0, 8.0, 6.0, 8.0, 10.0, 17.0, 23.0, 21.0, 42.0, 40.0, 63.0, 109.0, 190.0, 399.0, 930.0, 2347.0, 7610.0, 32234.0, 214682.0, 1426774.0, 2031459.0, 405066.0, 55017.0, 11390.0, 3333.0, 1250.0, 523.0, 260.0, 141.0, 84.0, 63.0, 37.0, 24.0, 22.0, 14.0, 21.0, 16.0, 12.0, 7.0, 3.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.390625, -17.78076171875, -17.1708984375, -16.56103515625, -15.951171875, -15.34130859375, -14.7314453125, -14.12158203125, -13.51171875, -12.90185546875, -12.2919921875, -11.68212890625, -11.072265625, -10.46240234375, -9.8525390625, -9.24267578125, -8.6328125, -8.02294921875, -7.4130859375, -6.80322265625, -6.193359375, -5.58349609375, -4.9736328125, -4.36376953125, -3.75390625, -3.14404296875, -2.5341796875, -1.92431640625, -1.314453125, -0.70458984375, -0.0947265625, 0.51513671875, 1.125, 1.73486328125, 2.3447265625, 2.95458984375, 3.564453125, 4.17431640625, 4.7841796875, 5.39404296875, 6.00390625, 6.61376953125, 7.2236328125, 7.83349609375, 8.443359375, 9.05322265625, 9.6630859375, 10.27294921875, 10.8828125, 11.49267578125, 12.1025390625, 12.71240234375, 13.322265625, 13.93212890625, 14.5419921875, 15.15185546875, 15.76171875, 16.37158203125, 16.9814453125, 17.59130859375, 18.201171875, 18.81103515625, 19.4208984375, 20.03076171875, 20.640625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 9.0, 20.0, 25.0, 38.0, 63.0, 100.0, 149.0, 250.0, 408.0, 585.0, 741.0, 610.0, 433.0, 248.0, 151.0, 92.0, 66.0, 31.0, 19.0, 16.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.6875, -16.7314453125, -15.775390625, -14.8193359375, -13.86328125, -12.9072265625, -11.951171875, -10.9951171875, -10.0390625, -9.0830078125, -8.126953125, -7.1708984375, -6.21484375, -5.2587890625, -4.302734375, -3.3466796875, -2.390625, -1.4345703125, -0.478515625, 0.4775390625, 1.43359375, 2.3896484375, 3.345703125, 4.3017578125, 5.2578125, 6.2138671875, 7.169921875, 8.1259765625, 9.08203125, 10.0380859375, 10.994140625, 11.9501953125, 12.90625, 13.8623046875, 14.818359375, 15.7744140625, 16.73046875, 17.6865234375, 18.642578125, 19.5986328125, 20.5546875, 21.5107421875, 22.466796875, 23.4228515625, 24.37890625, 25.3349609375, 26.291015625, 27.2470703125, 28.203125, 29.1591796875, 30.115234375, 31.0712890625, 32.02734375, 32.9833984375, 33.939453125, 34.8955078125, 35.8515625, 36.8076171875, 37.763671875, 38.7197265625, 39.67578125, 40.6318359375, 41.587890625, 42.5439453125, 43.5]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 13.0, 19.0, 19.0, 41.0, 56.0, 77.0, 146.0, 204.0, 342.0, 618.0, 2055.0, 104236.0, 3996510.0, 86423.0, 1933.0, 620.0, 343.0, 224.0, 128.0, 96.0, 71.0, 38.0, 33.0, 12.0, 7.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-116.0, -113.26953125, -110.5390625, -107.80859375, -105.078125, -102.34765625, -99.6171875, -96.88671875, -94.15625, -91.42578125, -88.6953125, -85.96484375, -83.234375, -80.50390625, -77.7734375, -75.04296875, -72.3125, -69.58203125, -66.8515625, -64.12109375, -61.390625, -58.66015625, -55.9296875, -53.19921875, -50.46875, -47.73828125, -45.0078125, -42.27734375, -39.546875, -36.81640625, -34.0859375, -31.35546875, -28.625, -25.89453125, -23.1640625, -20.43359375, -17.703125, -14.97265625, -12.2421875, -9.51171875, -6.78125, -4.05078125, -1.3203125, 1.41015625, 4.140625, 6.87109375, 9.6015625, 12.33203125, 15.0625, 17.79296875, 20.5234375, 23.25390625, 25.984375, 28.71484375, 31.4453125, 34.17578125, 36.90625, 39.63671875, 42.3671875, 45.09765625, 47.828125, 50.55859375, 53.2890625, 56.01953125, 58.75]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 20.0, 66.0, 120.0, 183.0, 241.0, 186.0, 120.0, 50.0, 16.0, 8.0, 2.0, 1.0], "bins": [-347.1307678222656, -340.98828125, -334.84576416015625, -328.7032775878906, -322.560791015625, -316.41827392578125, -310.2757873535156, -304.1332702636719, -297.99078369140625, -291.8482971191406, -285.7057800292969, -279.56329345703125, -273.4207763671875, -267.2782897949219, -261.13580322265625, -254.99330139160156, -248.85079956054688, -242.7082977294922, -236.5657958984375, -230.42330932617188, -224.2808074951172, -218.1383056640625, -211.99581909179688, -205.8533172607422, -199.7108154296875, -193.5683135986328, -187.42581176757812, -181.2833251953125, -175.1408233642578, -168.99832153320312, -162.8558349609375, -156.7133331298828, -150.57083129882812, -144.42832946777344, -138.28582763671875, -132.14334106445312, -126.00083923339844, -119.85833740234375, -113.7158432006836, -107.57334899902344, -101.43085479736328, -95.28836059570312, -89.14585876464844, -83.00335693359375, -76.8608627319336, -70.71836853027344, -64.57586669921875, -58.43336868286133, -52.290870666503906, -46.148372650146484, -40.00587463378906, -33.86337661743164, -27.72087860107422, -21.578380584716797, -15.435882568359375, -9.293384552001953, -3.1508865356445312, 2.9916114807128906, 9.134109497070312, 15.276607513427734, 21.419105529785156, 27.561603546142578, 33.7041015625, 39.84659957885742, 45.989097595214844]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 6.0, 10.0, 10.0, 5.0, 20.0, 13.0, 10.0, 14.0, 17.0, 24.0, 28.0, 30.0, 29.0, 22.0, 37.0, 22.0, 41.0, 38.0, 39.0, 43.0, 43.0, 51.0, 48.0, 31.0, 38.0, 23.0, 41.0, 41.0, 26.0, 22.0, 21.0, 19.0, 31.0, 12.0, 12.0, 13.0, 13.0, 12.0, 11.0, 6.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.06024169921875, -52.16075134277344, -50.26126480102539, -48.361778259277344, -46.46228790283203, -44.56279754638672, -42.66331100463867, -40.763824462890625, -38.86433410644531, -36.96484375, -35.06535720825195, -33.165870666503906, -31.266380310058594, -29.366891860961914, -27.467403411865234, -25.567914962768555, -23.668426513671875, -21.768938064575195, -19.869449615478516, -17.969961166381836, -16.070472717285156, -14.170984268188477, -12.271495819091797, -10.372007369995117, -8.472518920898438, -6.573030471801758, -4.673542022705078, -2.7740535736083984, -0.8745651245117188, 1.024923324584961, 2.9244117736816406, 4.82390022277832, 6.723388671875, 8.62287712097168, 10.52236557006836, 12.421854019165039, 14.321342468261719, 16.2208309173584, 18.120319366455078, 20.019807815551758, 21.919296264648438, 23.818784713745117, 25.718273162841797, 27.617761611938477, 29.517250061035156, 31.416738510131836, 33.316226959228516, 35.21571350097656, 37.115203857421875, 39.01469421386719, 40.914180755615234, 42.81366729736328, 44.713157653808594, 46.612648010253906, 48.51213455200195, 50.41162109375, 52.31111145019531, 54.210601806640625, 56.11008834838867, 58.00957489013672, 59.90906524658203, 61.808555603027344, 63.70804214477539, 65.60752868652344, 67.50701904296875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 2.0, 4.0, 4.0, 5.0, 9.0, 13.0, 11.0, 17.0, 11.0, 20.0, 18.0, 19.0, 27.0, 21.0, 25.0, 33.0, 28.0, 32.0, 45.0, 42.0, 37.0, 30.0, 29.0, 39.0, 42.0, 36.0, 31.0, 33.0, 40.0, 34.0, 35.0, 37.0, 23.0, 30.0, 11.0, 24.0, 18.0, 17.0, 15.0, 8.0, 9.0, 8.0, 7.0, 4.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.890625, -8.606201171875, -8.32177734375, -8.037353515625, -7.7529296875, -7.468505859375, -7.18408203125, -6.899658203125, -6.615234375, -6.330810546875, -6.04638671875, -5.761962890625, -5.4775390625, -5.193115234375, -4.90869140625, -4.624267578125, -4.33984375, -4.055419921875, -3.77099609375, -3.486572265625, -3.2021484375, -2.917724609375, -2.63330078125, -2.348876953125, -2.064453125, -1.780029296875, -1.49560546875, -1.211181640625, -0.9267578125, -0.642333984375, -0.35791015625, -0.073486328125, 0.2109375, 0.495361328125, 0.77978515625, 1.064208984375, 1.3486328125, 1.633056640625, 1.91748046875, 2.201904296875, 2.486328125, 2.770751953125, 3.05517578125, 3.339599609375, 3.6240234375, 3.908447265625, 4.19287109375, 4.477294921875, 4.76171875, 5.046142578125, 5.33056640625, 5.614990234375, 5.8994140625, 6.183837890625, 6.46826171875, 6.752685546875, 7.037109375, 7.321533203125, 7.60595703125, 7.890380859375, 8.1748046875, 8.459228515625, 8.74365234375, 9.028076171875, 9.3125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 8.0, 17.0, 25.0, 39.0, 65.0, 79.0, 141.0, 210.0, 313.0, 540.0, 853.0, 1401.0, 2188.0, 3448.0, 5803.0, 9527.0, 15555.0, 26664.0, 45234.0, 77592.0, 130144.0, 195933.0, 199420.0, 135213.0, 81070.0, 47506.0, 27680.0, 16526.0, 9657.0, 5976.0, 3650.0, 2299.0, 1376.0, 874.0, 559.0, 363.0, 208.0, 141.0, 87.0, 69.0, 32.0, 27.0, 16.0, 10.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.8935470581054688, -0.8627777099609375, -0.8320083618164062, -0.801239013671875, -0.7704696655273438, -0.7397003173828125, -0.7089309692382812, -0.67816162109375, -0.6473922729492188, -0.6166229248046875, -0.5858535766601562, -0.555084228515625, -0.5243148803710938, -0.4935455322265625, -0.46277618408203125, -0.4320068359375, -0.40123748779296875, -0.3704681396484375, -0.33969879150390625, -0.308929443359375, -0.27816009521484375, -0.2473907470703125, -0.21662139892578125, -0.18585205078125, -0.15508270263671875, -0.1243133544921875, -0.09354400634765625, -0.062774658203125, -0.03200531005859375, -0.0012359619140625, 0.02953338623046875, 0.060302734375, 0.09107208251953125, 0.1218414306640625, 0.15261077880859375, 0.183380126953125, 0.21414947509765625, 0.2449188232421875, 0.27568817138671875, 0.30645751953125, 0.33722686767578125, 0.3679962158203125, 0.39876556396484375, 0.429534912109375, 0.46030426025390625, 0.4910736083984375, 0.5218429565429688, 0.5526123046875, 0.5833816528320312, 0.6141510009765625, 0.6449203491210938, 0.675689697265625, 0.7064590454101562, 0.7372283935546875, 0.7679977416992188, 0.79876708984375, 0.8295364379882812, 0.8603057861328125, 0.8910751342773438, 0.921844482421875, 0.9526138305664062, 0.9833831787109375, 1.0141525268554688, 1.044921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 10.0, 7.0, 17.0, 20.0, 15.0, 24.0, 19.0, 22.0, 25.0, 33.0, 17.0, 43.0, 41.0, 31.0, 30.0, 52.0, 42.0, 1060.0, 38.0, 37.0, 31.0, 44.0, 37.0, 34.0, 37.0, 29.0, 25.0, 27.0, 22.0, 18.0, 24.0, 12.0, 13.0, 22.0, 4.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.0078125, -5.8194580078125, -5.631103515625, -5.4427490234375, -5.25439453125, -5.0660400390625, -4.877685546875, -4.6893310546875, -4.5009765625, -4.3126220703125, -4.124267578125, -3.9359130859375, -3.74755859375, -3.5592041015625, -3.370849609375, -3.1824951171875, -2.994140625, -2.8057861328125, -2.617431640625, -2.4290771484375, -2.24072265625, -2.0523681640625, -1.864013671875, -1.6756591796875, -1.4873046875, -1.2989501953125, -1.110595703125, -0.9222412109375, -0.73388671875, -0.5455322265625, -0.357177734375, -0.1688232421875, 0.01953125, 0.2078857421875, 0.396240234375, 0.5845947265625, 0.77294921875, 0.9613037109375, 1.149658203125, 1.3380126953125, 1.5263671875, 1.7147216796875, 1.903076171875, 2.0914306640625, 2.27978515625, 2.4681396484375, 2.656494140625, 2.8448486328125, 3.033203125, 3.2215576171875, 3.409912109375, 3.5982666015625, 3.78662109375, 3.9749755859375, 4.163330078125, 4.3516845703125, 4.5400390625, 4.7283935546875, 4.916748046875, 5.1051025390625, 5.29345703125, 5.4818115234375, 5.670166015625, 5.8585205078125, 6.046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 19.0, 20.0, 30.0, 43.0, 83.0, 113.0, 218.0, 326.0, 502.0, 770.0, 1243.0, 2092.0, 3527.0, 6084.0, 10395.0, 18450.0, 32373.0, 57659.0, 99069.0, 162468.0, 1204434.0, 211875.0, 119944.0, 71528.0, 40323.0, 22927.0, 12653.0, 7287.0, 4193.0, 2539.0, 1423.0, 927.0, 582.0, 347.0, 203.0, 142.0, 118.0, 55.0, 39.0, 38.0, 19.0, 18.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68603515625, -0.6643829345703125, -0.642730712890625, -0.6210784912109375, -0.59942626953125, -0.5777740478515625, -0.556121826171875, -0.5344696044921875, -0.5128173828125, -0.4911651611328125, -0.469512939453125, -0.4478607177734375, -0.42620849609375, -0.4045562744140625, -0.382904052734375, -0.3612518310546875, -0.339599609375, -0.3179473876953125, -0.296295166015625, -0.2746429443359375, -0.25299072265625, -0.2313385009765625, -0.209686279296875, -0.1880340576171875, -0.1663818359375, -0.1447296142578125, -0.123077392578125, -0.1014251708984375, -0.07977294921875, -0.0581207275390625, -0.036468505859375, -0.0148162841796875, 0.0068359375, 0.0284881591796875, 0.050140380859375, 0.0717926025390625, 0.09344482421875, 0.1150970458984375, 0.136749267578125, 0.1584014892578125, 0.1800537109375, 0.2017059326171875, 0.223358154296875, 0.2450103759765625, 0.26666259765625, 0.2883148193359375, 0.309967041015625, 0.3316192626953125, 0.353271484375, 0.3749237060546875, 0.396575927734375, 0.4182281494140625, 0.43988037109375, 0.4615325927734375, 0.483184814453125, 0.5048370361328125, 0.5264892578125, 0.5481414794921875, 0.569793701171875, 0.5914459228515625, 0.61309814453125, 0.6347503662109375, 0.656402587890625, 0.6780548095703125, 0.69970703125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 8.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 16.0, 15.0, 17.0, 23.0, 24.0, 28.0, 40.0, 58.0, 74.0, 117.0, 106.0, 80.0, 64.0, 50.0, 32.0, 37.0, 22.0, 16.0, 12.0, 11.0, 11.0, 13.0, 7.0, 8.0, 9.0, 6.0, 5.0, 5.0, 9.0, 6.0, 3.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032501220703125, -0.03148984909057617, -0.030478477478027344, -0.029467105865478516, -0.028455734252929688, -0.02744436264038086, -0.02643299102783203, -0.025421619415283203, -0.024410247802734375, -0.023398876190185547, -0.02238750457763672, -0.02137613296508789, -0.020364761352539062, -0.019353389739990234, -0.018342018127441406, -0.017330646514892578, -0.01631927490234375, -0.015307903289794922, -0.014296531677246094, -0.013285160064697266, -0.012273788452148438, -0.01126241683959961, -0.010251045227050781, -0.009239673614501953, -0.008228302001953125, -0.007216930389404297, -0.006205558776855469, -0.005194187164306641, -0.0041828155517578125, -0.0031714439392089844, -0.0021600723266601562, -0.0011487007141113281, -0.0001373291015625, 0.0008740425109863281, 0.0018854141235351562, 0.0028967857360839844, 0.0039081573486328125, 0.004919528961181641, 0.005930900573730469, 0.006942272186279297, 0.007953643798828125, 0.008965015411376953, 0.009976387023925781, 0.01098775863647461, 0.011999130249023438, 0.013010501861572266, 0.014021873474121094, 0.015033245086669922, 0.01604461669921875, 0.017055988311767578, 0.018067359924316406, 0.019078731536865234, 0.020090103149414062, 0.02110147476196289, 0.02211284637451172, 0.023124217987060547, 0.024135589599609375, 0.025146961212158203, 0.02615833282470703, 0.02716970443725586, 0.028181076049804688, 0.029192447662353516, 0.030203819274902344, 0.031215190887451172, 0.0322265625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 7.0, 3.0, 5.0, 6.0, 10.0, 8.0, 4.0, 14.0, 14.0, 18.0, 23.0, 18.0, 22.0, 29.0, 22.0, 50.0, 73.0, 154.0, 234.0, 473.0, 3969.0, 949634.0, 91753.0, 1118.0, 328.0, 191.0, 107.0, 60.0, 38.0, 22.0, 28.0, 19.0, 24.0, 15.0, 11.0, 7.0, 7.0, 9.0, 3.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.6362380981445312, -0.6162261962890625, -0.5962142944335938, -0.576202392578125, -0.5561904907226562, -0.5361785888671875, -0.5161666870117188, -0.49615478515625, -0.47614288330078125, -0.4561309814453125, -0.43611907958984375, -0.416107177734375, -0.39609527587890625, -0.3760833740234375, -0.35607147216796875, -0.3360595703125, -0.31604766845703125, -0.2960357666015625, -0.27602386474609375, -0.256011962890625, -0.23600006103515625, -0.2159881591796875, -0.19597625732421875, -0.17596435546875, -0.15595245361328125, -0.1359405517578125, -0.11592864990234375, -0.095916748046875, -0.07590484619140625, -0.0558929443359375, -0.03588104248046875, -0.015869140625, 0.00414276123046875, 0.0241546630859375, 0.04416656494140625, 0.064178466796875, 0.08419036865234375, 0.1042022705078125, 0.12421417236328125, 0.14422607421875, 0.16423797607421875, 0.1842498779296875, 0.20426177978515625, 0.224273681640625, 0.24428558349609375, 0.2642974853515625, 0.28430938720703125, 0.3043212890625, 0.32433319091796875, 0.3443450927734375, 0.36435699462890625, 0.384368896484375, 0.40438079833984375, 0.4243927001953125, 0.44440460205078125, 0.46441650390625, 0.48442840576171875, 0.5044403076171875, 0.5244522094726562, 0.544464111328125, 0.5644760131835938, 0.5844879150390625, 0.6044998168945312, 0.62451171875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [956.0, 59.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011058940552175045, 0.004542824812233448, 0.020144589245319366, 0.03574635460972786, 0.05134811997413635, 0.06694988906383514, 0.08255165070295334, 0.09815341234207153, 0.11375518143177032, 0.12935695052146912, 0.1449587047100067, 0.1605604737997055, 0.1761622428894043, 0.1917640119791031, 0.20736578106880188, 0.22296753525733948, 0.23856930434703827, 0.25417107343673706, 0.26977282762527466, 0.28537461161613464, 0.30097636580467224, 0.3165781497955322, 0.3321799039840698, 0.3477816581726074, 0.3633834421634674, 0.378985196352005, 0.394586980342865, 0.4101887345314026, 0.4257904887199402, 0.44139227271080017, 0.45699402689933777, 0.47259581089019775, 0.48819756507873535, 0.503799319267273, 0.5194010734558105, 0.5350028872489929, 0.5506046414375305, 0.5662063956260681, 0.5818081498146057, 0.5974099040031433, 0.6130117177963257, 0.6286134719848633, 0.6442152261734009, 0.6598170399665833, 0.6754187941551208, 0.6910205483436584, 0.706622302532196, 0.7222240567207336, 0.7378258109092712, 0.7534275650978088, 0.7690293192863464, 0.7846311330795288, 0.8002328872680664, 0.815834641456604, 0.8314363956451416, 0.8470381498336792, 0.8626399040222168, 0.8782416582107544, 0.893843412399292, 0.9094452261924744, 0.925046980381012, 0.9406487345695496, 0.9562504887580872, 0.9718522429466248, 0.9874540567398071]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 10.0, 13.0, 12.0, 30.0, 34.0, 37.0, 70.0, 71.0, 76.0, 86.0, 77.0, 107.0, 74.0, 82.0, 50.0, 62.0, 33.0, 31.0, 23.0, 16.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05185270309448242, -0.05042874813079834, -0.04900478944182396, -0.04758083075284958, -0.0461568757891655, -0.044732920825481415, -0.043308962136507034, -0.041885003447532654, -0.04046104848384857, -0.03903709352016449, -0.03761313483119011, -0.03618917614221573, -0.03476522117853165, -0.033341266214847565, -0.031917307525873184, -0.030493350699543953, -0.02906939387321472, -0.02764543704688549, -0.02622148022055626, -0.024797523394227028, -0.023373566567897797, -0.021949609741568565, -0.020525652915239334, -0.019101696088910103, -0.01767773926258087, -0.01625378243625164, -0.014829825609922409, -0.013405868783593178, -0.011981911957263947, -0.010557955130934715, -0.009133998304605484, -0.007710041478276253, -0.0062860846519470215, -0.00486212782561779, -0.003438170999288559, -0.0020142141729593277, -0.0005902573466300964, 0.0008336994796991348, 0.002257656306028366, 0.0036816131323575974, 0.005105569958686829, 0.00652952678501606, 0.007953483611345291, 0.009377440437674522, 0.010801397264003754, 0.012225354090332985, 0.013649310916662216, 0.015073267742991447, 0.01649722456932068, 0.01792118139564991, 0.01934513822197914, 0.020769095048308372, 0.022193051874637604, 0.023617008700966835, 0.025040965527296066, 0.026464922353625298, 0.02788887917995453, 0.02931283600628376, 0.03073679283261299, 0.03216075152158737, 0.033584706485271454, 0.035008661448955536, 0.036432620137929916, 0.0378565788269043, 0.03928053379058838]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 2.0, 4.0, 4.0, 5.0, 9.0, 13.0, 11.0, 17.0, 11.0, 20.0, 18.0, 19.0, 27.0, 21.0, 25.0, 33.0, 28.0, 32.0, 45.0, 43.0, 36.0, 30.0, 29.0, 38.0, 43.0, 36.0, 31.0, 33.0, 40.0, 34.0, 35.0, 37.0, 23.0, 30.0, 11.0, 24.0, 18.0, 17.0, 15.0, 8.0, 9.0, 8.0, 7.0, 4.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.890625, -8.606201171875, -8.32177734375, -8.037353515625, -7.7529296875, -7.468505859375, -7.18408203125, -6.899658203125, -6.615234375, -6.330810546875, -6.04638671875, -5.761962890625, -5.4775390625, -5.193115234375, -4.90869140625, -4.624267578125, -4.33984375, -4.055419921875, -3.77099609375, -3.486572265625, -3.2021484375, -2.917724609375, -2.63330078125, -2.348876953125, -2.064453125, -1.780029296875, -1.49560546875, -1.211181640625, -0.9267578125, -0.642333984375, -0.35791015625, -0.073486328125, 0.2109375, 0.495361328125, 0.77978515625, 1.064208984375, 1.3486328125, 1.633056640625, 1.91748046875, 2.201904296875, 2.486328125, 2.770751953125, 3.05517578125, 3.339599609375, 3.6240234375, 3.908447265625, 4.19287109375, 4.477294921875, 4.76171875, 5.046142578125, 5.33056640625, 5.614990234375, 5.8994140625, 6.183837890625, 6.46826171875, 6.752685546875, 7.037109375, 7.321533203125, 7.60595703125, 7.890380859375, 8.1748046875, 8.459228515625, 8.74365234375, 9.028076171875, 9.3125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 4.0, 5.0, 5.0, 15.0, 19.0, 17.0, 41.0, 38.0, 75.0, 115.0, 154.0, 257.0, 420.0, 591.0, 979.0, 1581.0, 2693.0, 4632.0, 9056.0, 20927.0, 65333.0, 258723.0, 486852.0, 130674.0, 36321.0, 13544.0, 6349.0, 3494.0, 2149.0, 1278.0, 797.0, 494.0, 317.0, 178.0, 146.0, 86.0, 72.0, 35.0, 18.0, 17.0, 13.0, 11.0, 5.0, 8.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.40625, -8.1373291015625, -7.868408203125, -7.5994873046875, -7.33056640625, -7.0616455078125, -6.792724609375, -6.5238037109375, -6.2548828125, -5.9859619140625, -5.717041015625, -5.4481201171875, -5.17919921875, -4.9102783203125, -4.641357421875, -4.3724365234375, -4.103515625, -3.8345947265625, -3.565673828125, -3.2967529296875, -3.02783203125, -2.7589111328125, -2.489990234375, -2.2210693359375, -1.9521484375, -1.6832275390625, -1.414306640625, -1.1453857421875, -0.87646484375, -0.6075439453125, -0.338623046875, -0.0697021484375, 0.19921875, 0.4681396484375, 0.737060546875, 1.0059814453125, 1.27490234375, 1.5438232421875, 1.812744140625, 2.0816650390625, 2.3505859375, 2.6195068359375, 2.888427734375, 3.1573486328125, 3.42626953125, 3.6951904296875, 3.964111328125, 4.2330322265625, 4.501953125, 4.7708740234375, 5.039794921875, 5.3087158203125, 5.57763671875, 5.8465576171875, 6.115478515625, 6.3843994140625, 6.6533203125, 6.9222412109375, 7.191162109375, 7.4600830078125, 7.72900390625, 7.9979248046875, 8.266845703125, 8.5357666015625, 8.8046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 10.0, 18.0, 16.0, 11.0, 10.0, 18.0, 19.0, 27.0, 23.0, 33.0, 33.0, 40.0, 38.0, 49.0, 69.0, 97.0, 1618.0, 368.0, 98.0, 59.0, 53.0, 37.0, 42.0, 38.0, 33.0, 35.0, 22.0, 18.0, 27.0, 17.0, 9.0, 15.0, 8.0, 1.0, 5.0, 9.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.25, -33.1416015625, -32.033203125, -30.9248046875, -29.81640625, -28.7080078125, -27.599609375, -26.4912109375, -25.3828125, -24.2744140625, -23.166015625, -22.0576171875, -20.94921875, -19.8408203125, -18.732421875, -17.6240234375, -16.515625, -15.4072265625, -14.298828125, -13.1904296875, -12.08203125, -10.9736328125, -9.865234375, -8.7568359375, -7.6484375, -6.5400390625, -5.431640625, -4.3232421875, -3.21484375, -2.1064453125, -0.998046875, 0.1103515625, 1.21875, 2.3271484375, 3.435546875, 4.5439453125, 5.65234375, 6.7607421875, 7.869140625, 8.9775390625, 10.0859375, 11.1943359375, 12.302734375, 13.4111328125, 14.51953125, 15.6279296875, 16.736328125, 17.8447265625, 18.953125, 20.0615234375, 21.169921875, 22.2783203125, 23.38671875, 24.4951171875, 25.603515625, 26.7119140625, 27.8203125, 28.9287109375, 30.037109375, 31.1455078125, 32.25390625, 33.3623046875, 34.470703125, 35.5791015625, 36.6875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 10.0, 11.0, 8.0, 25.0, 15.0, 42.0, 52.0, 79.0, 108.0, 176.0, 300.0, 509.0, 2751.0, 2857132.0, 281409.0, 1878.0, 478.0, 233.0, 154.0, 104.0, 71.0, 36.0, 26.0, 22.0, 29.0, 8.0, 8.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.9375, -86.4677734375, -82.998046875, -79.5283203125, -76.05859375, -72.5888671875, -69.119140625, -65.6494140625, -62.1796875, -58.7099609375, -55.240234375, -51.7705078125, -48.30078125, -44.8310546875, -41.361328125, -37.8916015625, -34.421875, -30.9521484375, -27.482421875, -24.0126953125, -20.54296875, -17.0732421875, -13.603515625, -10.1337890625, -6.6640625, -3.1943359375, 0.275390625, 3.7451171875, 7.21484375, 10.6845703125, 14.154296875, 17.6240234375, 21.09375, 24.5634765625, 28.033203125, 31.5029296875, 34.97265625, 38.4423828125, 41.912109375, 45.3818359375, 48.8515625, 52.3212890625, 55.791015625, 59.2607421875, 62.73046875, 66.2001953125, 69.669921875, 73.1396484375, 76.609375, 80.0791015625, 83.548828125, 87.0185546875, 90.48828125, 93.9580078125, 97.427734375, 100.8974609375, 104.3671875, 107.8369140625, 111.306640625, 114.7763671875, 118.24609375, 121.7158203125, 125.185546875, 128.6552734375, 132.125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 11.0, 34.0, 89.0, 165.0, 237.0, 210.0, 146.0, 81.0, 28.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.183643341064453, -10.430811882019043, -8.677980422973633, -6.925148010253906, -5.172316551208496, -3.419485092163086, -1.6666526794433594, 0.08617877960205078, 1.839010238647461, 3.59184193611145, 5.3446736335754395, 7.097505569458008, 8.850337028503418, 10.603168487548828, 12.356000900268555, 14.108832359313965, 15.861663818359375, 17.6144962310791, 19.367326736450195, 21.120159149169922, 22.872989654541016, 24.625822067260742, 26.37865447998047, 28.131484985351562, 29.88431739807129, 31.637149810791016, 33.38998031616211, 35.14281463623047, 36.89564514160156, 38.648475646972656, 40.40130615234375, 42.15414047241211, 43.90696716308594, 45.65979766845703, 47.41263198852539, 49.165462493896484, 50.91829299926758, 52.67112731933594, 54.42395782470703, 56.176788330078125, 57.92961883544922, 59.68244934082031, 61.43528366088867, 63.188114166259766, 64.94094848632812, 66.69377899169922, 68.44660949707031, 70.1994400024414, 71.9522705078125, 73.7051010131836, 75.45793151855469, 77.21076965332031, 78.9636001586914, 80.7164306640625, 82.4692611694336, 84.22209167480469, 85.97492980957031, 87.7277603149414, 89.4805908203125, 91.23342895507812, 92.98625946044922, 94.73908996582031, 96.4919204711914, 98.2447509765625, 99.9975814819336]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 6.0, 9.0, 10.0, 10.0, 13.0, 18.0, 24.0, 14.0, 20.0, 27.0, 22.0, 27.0, 31.0, 24.0, 32.0, 48.0, 32.0, 51.0, 41.0, 44.0, 37.0, 46.0, 42.0, 53.0, 36.0, 37.0, 19.0, 34.0, 24.0, 20.0, 30.0, 20.0, 11.0, 18.0, 16.0, 13.0, 6.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-84.25794219970703, -81.59794616699219, -78.93795013427734, -76.2779541015625, -73.61795806884766, -70.95796203613281, -68.29796600341797, -65.63796997070312, -62.97797393798828, -60.31797790527344, -57.657981872558594, -54.99798583984375, -52.337989807128906, -49.67799377441406, -47.01799774169922, -44.358001708984375, -41.698001861572266, -39.03800582885742, -36.37800979614258, -33.718013763427734, -31.05801773071289, -28.398021697998047, -25.73802375793457, -23.078027725219727, -20.418031692504883, -17.75803565979004, -15.098039627075195, -12.438042640686035, -9.778046607971191, -7.118050575256348, -4.4580535888671875, -1.7980575561523438, 0.8619384765625, 3.521934747695923, 6.181931018829346, 8.841927528381348, 11.501923561096191, 14.161919593811035, 16.821916580200195, 19.48191261291504, 22.141908645629883, 24.801904678344727, 27.46190071105957, 30.121898651123047, 32.78189468383789, 35.441890716552734, 38.10188674926758, 40.76188278198242, 43.421878814697266, 46.08187484741211, 48.74187088012695, 51.4018669128418, 54.06186294555664, 56.721858978271484, 59.381858825683594, 62.04185485839844, 64.70185089111328, 67.36184692382812, 70.02184295654297, 72.68183898925781, 75.34183502197266, 78.0018310546875, 80.66182708740234, 83.32182312011719, 85.98181915283203]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 3.0, 9.0, 7.0, 11.0, 17.0, 8.0, 13.0, 17.0, 28.0, 20.0, 26.0, 25.0, 35.0, 38.0, 24.0, 36.0, 50.0, 32.0, 40.0, 36.0, 42.0, 36.0, 33.0, 32.0, 28.0, 47.0, 44.0, 26.0, 34.0, 21.0, 21.0, 24.0, 25.0, 22.0, 16.0, 14.0, 10.0, 5.0, 10.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8671875, -8.5640869140625, -8.260986328125, -7.9578857421875, -7.65478515625, -7.3516845703125, -7.048583984375, -6.7454833984375, -6.4423828125, -6.1392822265625, -5.836181640625, -5.5330810546875, -5.22998046875, -4.9268798828125, -4.623779296875, -4.3206787109375, -4.017578125, -3.7144775390625, -3.411376953125, -3.1082763671875, -2.80517578125, -2.5020751953125, -2.198974609375, -1.8958740234375, -1.5927734375, -1.2896728515625, -0.986572265625, -0.6834716796875, -0.38037109375, -0.0772705078125, 0.225830078125, 0.5289306640625, 0.83203125, 1.1351318359375, 1.438232421875, 1.7413330078125, 2.04443359375, 2.3475341796875, 2.650634765625, 2.9537353515625, 3.2568359375, 3.5599365234375, 3.863037109375, 4.1661376953125, 4.46923828125, 4.7723388671875, 5.075439453125, 5.3785400390625, 5.681640625, 5.9847412109375, 6.287841796875, 6.5909423828125, 6.89404296875, 7.1971435546875, 7.500244140625, 7.8033447265625, 8.1064453125, 8.4095458984375, 8.712646484375, 9.0157470703125, 9.31884765625, 9.6219482421875, 9.925048828125, 10.2281494140625, 10.53125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 11.0, 4.0, 16.0, 11.0, 13.0, 12.0, 15.0, 27.0, 21.0, 35.0, 41.0, 58.0, 64.0, 85.0, 140.0, 220.0, 381.0, 840.0, 2034.0, 6350.0, 27296.0, 178546.0, 1312902.0, 2140453.0, 449780.0, 57232.0, 11738.0, 3190.0, 1240.0, 581.0, 290.0, 152.0, 118.0, 78.0, 59.0, 64.0, 38.0, 36.0, 28.0, 15.0, 18.0, 15.0, 5.0, 4.0, 10.0, 7.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.3125, -18.69384765625, -18.0751953125, -17.45654296875, -16.837890625, -16.21923828125, -15.6005859375, -14.98193359375, -14.36328125, -13.74462890625, -13.1259765625, -12.50732421875, -11.888671875, -11.27001953125, -10.6513671875, -10.03271484375, -9.4140625, -8.79541015625, -8.1767578125, -7.55810546875, -6.939453125, -6.32080078125, -5.7021484375, -5.08349609375, -4.46484375, -3.84619140625, -3.2275390625, -2.60888671875, -1.990234375, -1.37158203125, -0.7529296875, -0.13427734375, 0.484375, 1.10302734375, 1.7216796875, 2.34033203125, 2.958984375, 3.57763671875, 4.1962890625, 4.81494140625, 5.43359375, 6.05224609375, 6.6708984375, 7.28955078125, 7.908203125, 8.52685546875, 9.1455078125, 9.76416015625, 10.3828125, 11.00146484375, 11.6201171875, 12.23876953125, 12.857421875, 13.47607421875, 14.0947265625, 14.71337890625, 15.33203125, 15.95068359375, 16.5693359375, 17.18798828125, 17.806640625, 18.42529296875, 19.0439453125, 19.66259765625, 20.28125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 9.0, 15.0, 15.0, 17.0, 19.0, 28.0, 37.0, 53.0, 83.0, 99.0, 135.0, 192.0, 259.0, 315.0, 368.0, 454.0, 471.0, 375.0, 288.0, 230.0, 146.0, 132.0, 83.0, 61.0, 50.0, 36.0, 26.0, 15.0, 13.0, 12.0, 9.0, 8.0, 4.0, 6.0, 5.0, 0.0, 2.0, 3.0, 2.0, 2.0], "bins": [-23.015625, -22.43701171875, -21.8583984375, -21.27978515625, -20.701171875, -20.12255859375, -19.5439453125, -18.96533203125, -18.38671875, -17.80810546875, -17.2294921875, -16.65087890625, -16.072265625, -15.49365234375, -14.9150390625, -14.33642578125, -13.7578125, -13.17919921875, -12.6005859375, -12.02197265625, -11.443359375, -10.86474609375, -10.2861328125, -9.70751953125, -9.12890625, -8.55029296875, -7.9716796875, -7.39306640625, -6.814453125, -6.23583984375, -5.6572265625, -5.07861328125, -4.5, -3.92138671875, -3.3427734375, -2.76416015625, -2.185546875, -1.60693359375, -1.0283203125, -0.44970703125, 0.12890625, 0.70751953125, 1.2861328125, 1.86474609375, 2.443359375, 3.02197265625, 3.6005859375, 4.17919921875, 4.7578125, 5.33642578125, 5.9150390625, 6.49365234375, 7.072265625, 7.65087890625, 8.2294921875, 8.80810546875, 9.38671875, 9.96533203125, 10.5439453125, 11.12255859375, 11.701171875, 12.27978515625, 12.8583984375, 13.43701171875, 14.015625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 5.0, 5.0, 9.0, 5.0, 11.0, 16.0, 12.0, 17.0, 36.0, 48.0, 55.0, 69.0, 123.0, 172.0, 236.0, 379.0, 832.0, 5939.0, 882069.0, 3284911.0, 16780.0, 1138.0, 490.0, 261.0, 191.0, 135.0, 105.0, 72.0, 48.0, 29.0, 23.0, 19.0, 13.0, 13.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.6875, -63.07421875, -60.4609375, -57.84765625, -55.234375, -52.62109375, -50.0078125, -47.39453125, -44.78125, -42.16796875, -39.5546875, -36.94140625, -34.328125, -31.71484375, -29.1015625, -26.48828125, -23.875, -21.26171875, -18.6484375, -16.03515625, -13.421875, -10.80859375, -8.1953125, -5.58203125, -2.96875, -0.35546875, 2.2578125, 4.87109375, 7.484375, 10.09765625, 12.7109375, 15.32421875, 17.9375, 20.55078125, 23.1640625, 25.77734375, 28.390625, 31.00390625, 33.6171875, 36.23046875, 38.84375, 41.45703125, 44.0703125, 46.68359375, 49.296875, 51.91015625, 54.5234375, 57.13671875, 59.75, 62.36328125, 64.9765625, 67.58984375, 70.203125, 72.81640625, 75.4296875, 78.04296875, 80.65625, 83.26953125, 85.8828125, 88.49609375, 91.109375, 93.72265625, 96.3359375, 98.94921875, 101.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 29.0, 59.0, 104.0, 152.0, 194.0, 168.0, 143.0, 83.0, 41.0, 17.0, 14.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.11027526855469, -104.53605651855469, -99.96183776855469, -95.38761901855469, -90.81340026855469, -86.23918151855469, -81.66495513916016, -77.09073638916016, -72.51651763916016, -67.94229888916016, -63.368080139160156, -58.79385757446289, -54.21963882446289, -49.64542007446289, -45.071197509765625, -40.496978759765625, -35.922760009765625, -31.348541259765625, -26.774320602416992, -22.20009994506836, -17.62588119506836, -13.05166244506836, -8.477441787719727, -3.9032211303710938, 0.6709976196289062, 5.245217323303223, 9.819437026977539, 14.393656730651855, 18.967876434326172, 23.542095184326172, 28.116315841674805, 32.69053649902344, 37.2647705078125, 41.8389892578125, 46.4132080078125, 50.987430572509766, 55.561649322509766, 60.135868072509766, 64.71009063720703, 69.28430938720703, 73.85852813720703, 78.43274688720703, 83.00696563720703, 87.58118438720703, 92.15541076660156, 96.72962951660156, 101.30384826660156, 105.87806701660156, 110.45228576660156, 115.02650451660156, 119.60072326660156, 124.17494201660156, 128.74916076660156, 133.32337951660156, 137.89759826660156, 142.47183227539062, 147.04605102539062, 151.62026977539062, 156.19448852539062, 160.76870727539062, 165.34292602539062, 169.91714477539062, 174.49136352539062, 179.06558227539062, 183.63980102539062]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 15.0, 13.0, 14.0, 20.0, 21.0, 23.0, 32.0, 21.0, 26.0, 31.0, 30.0, 26.0, 43.0, 28.0, 38.0, 36.0, 44.0, 50.0, 48.0, 55.0, 51.0, 33.0, 44.0, 34.0, 25.0, 38.0, 27.0, 19.0, 21.0, 13.0, 12.0, 11.0, 11.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.7603759765625, -62.68702697753906, -60.613677978515625, -58.54032516479492, -56.466976165771484, -54.39362716674805, -52.320274353027344, -50.246925354003906, -48.17357635498047, -46.10022735595703, -44.026878356933594, -41.95352554321289, -39.88017654418945, -37.806827545166016, -35.73347473144531, -33.660125732421875, -31.586776733398438, -29.513427734375, -27.44007682800293, -25.36672592163086, -23.293376922607422, -21.220027923583984, -19.146677017211914, -17.073326110839844, -14.999977111816406, -12.926627159118652, -10.853277206420898, -8.779927253723145, -6.706577301025391, -4.633227348327637, -2.559877395629883, -0.4865274429321289, 1.586822509765625, 3.660172462463379, 5.733522415161133, 7.806872367858887, 9.88022232055664, 11.953572273254395, 14.026922225952148, 16.10027313232422, 18.173622131347656, 20.246971130371094, 22.320322036743164, 24.393672943115234, 26.467021942138672, 28.54037094116211, 30.61372184753418, 32.68707275390625, 34.76042175292969, 36.833770751953125, 38.90711975097656, 40.980472564697266, 43.0538215637207, 45.12717056274414, 47.200523376464844, 49.27387237548828, 51.34722137451172, 53.420570373535156, 55.493919372558594, 57.5672721862793, 59.640621185302734, 61.71397018432617, 63.787322998046875, 65.86067199707031, 67.93402099609375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 9.0, 4.0, 10.0, 14.0, 10.0, 12.0, 13.0, 15.0, 19.0, 23.0, 24.0, 22.0, 23.0, 27.0, 31.0, 34.0, 34.0, 41.0, 31.0, 36.0, 36.0, 33.0, 31.0, 22.0, 47.0, 45.0, 34.0, 21.0, 35.0, 24.0, 31.0, 31.0, 21.0, 22.0, 30.0, 12.0, 10.0, 19.0, 16.0, 8.0, 12.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.8984375, -8.6199951171875, -8.341552734375, -8.0631103515625, -7.78466796875, -7.5062255859375, -7.227783203125, -6.9493408203125, -6.6708984375, -6.3924560546875, -6.114013671875, -5.8355712890625, -5.55712890625, -5.2786865234375, -5.000244140625, -4.7218017578125, -4.443359375, -4.1649169921875, -3.886474609375, -3.6080322265625, -3.32958984375, -3.0511474609375, -2.772705078125, -2.4942626953125, -2.2158203125, -1.9373779296875, -1.658935546875, -1.3804931640625, -1.10205078125, -0.8236083984375, -0.545166015625, -0.2667236328125, 0.01171875, 0.2901611328125, 0.568603515625, 0.8470458984375, 1.12548828125, 1.4039306640625, 1.682373046875, 1.9608154296875, 2.2392578125, 2.5177001953125, 2.796142578125, 3.0745849609375, 3.35302734375, 3.6314697265625, 3.909912109375, 4.1883544921875, 4.466796875, 4.7452392578125, 5.023681640625, 5.3021240234375, 5.58056640625, 5.8590087890625, 6.137451171875, 6.4158935546875, 6.6943359375, 6.9727783203125, 7.251220703125, 7.5296630859375, 7.80810546875, 8.0865478515625, 8.364990234375, 8.6434326171875, 8.921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 10.0, 4.0, 11.0, 22.0, 24.0, 51.0, 58.0, 97.0, 158.0, 238.0, 364.0, 540.0, 767.0, 1109.0, 1760.0, 2628.0, 3951.0, 5874.0, 9026.0, 13912.0, 21021.0, 32258.0, 49882.0, 76009.0, 112694.0, 152450.0, 164224.0, 132193.0, 91781.0, 60455.0, 39663.0, 25960.0, 16782.0, 10970.0, 7310.0, 4851.0, 3201.0, 2065.0, 1430.0, 933.0, 646.0, 413.0, 254.0, 161.0, 120.0, 77.0, 56.0, 35.0, 28.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.74169921875, -0.71868896484375, -0.6956787109375, -0.67266845703125, -0.649658203125, -0.62664794921875, -0.6036376953125, -0.58062744140625, -0.5576171875, -0.53460693359375, -0.5115966796875, -0.48858642578125, -0.465576171875, -0.44256591796875, -0.4195556640625, -0.39654541015625, -0.37353515625, -0.35052490234375, -0.3275146484375, -0.30450439453125, -0.281494140625, -0.25848388671875, -0.2354736328125, -0.21246337890625, -0.189453125, -0.16644287109375, -0.1434326171875, -0.12042236328125, -0.097412109375, -0.07440185546875, -0.0513916015625, -0.02838134765625, -0.00537109375, 0.01763916015625, 0.0406494140625, 0.06365966796875, 0.086669921875, 0.10968017578125, 0.1326904296875, 0.15570068359375, 0.1787109375, 0.20172119140625, 0.2247314453125, 0.24774169921875, 0.270751953125, 0.29376220703125, 0.3167724609375, 0.33978271484375, 0.36279296875, 0.38580322265625, 0.4088134765625, 0.43182373046875, 0.454833984375, 0.47784423828125, 0.5008544921875, 0.52386474609375, 0.546875, 0.56988525390625, 0.5928955078125, 0.61590576171875, 0.638916015625, 0.66192626953125, 0.6849365234375, 0.70794677734375, 0.73095703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 5.0, 2.0, 6.0, 6.0, 9.0, 9.0, 13.0, 12.0, 12.0, 22.0, 26.0, 28.0, 25.0, 23.0, 37.0, 33.0, 34.0, 42.0, 43.0, 42.0, 1071.0, 43.0, 33.0, 59.0, 34.0, 37.0, 33.0, 43.0, 35.0, 25.0, 27.0, 33.0, 29.0, 14.0, 15.0, 18.0, 15.0, 7.0, 7.0, 7.0, 1.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9609375, -6.74285888671875, -6.5247802734375, -6.30670166015625, -6.088623046875, -5.87054443359375, -5.6524658203125, -5.43438720703125, -5.21630859375, -4.99822998046875, -4.7801513671875, -4.56207275390625, -4.343994140625, -4.12591552734375, -3.9078369140625, -3.68975830078125, -3.4716796875, -3.25360107421875, -3.0355224609375, -2.81744384765625, -2.599365234375, -2.38128662109375, -2.1632080078125, -1.94512939453125, -1.72705078125, -1.50897216796875, -1.2908935546875, -1.07281494140625, -0.854736328125, -0.63665771484375, -0.4185791015625, -0.20050048828125, 0.017578125, 0.23565673828125, 0.4537353515625, 0.67181396484375, 0.889892578125, 1.10797119140625, 1.3260498046875, 1.54412841796875, 1.76220703125, 1.98028564453125, 2.1983642578125, 2.41644287109375, 2.634521484375, 2.85260009765625, 3.0706787109375, 3.28875732421875, 3.5068359375, 3.72491455078125, 3.9429931640625, 4.16107177734375, 4.379150390625, 4.59722900390625, 4.8153076171875, 5.03338623046875, 5.25146484375, 5.46954345703125, 5.6876220703125, 5.90570068359375, 6.123779296875, 6.34185791015625, 6.5599365234375, 6.77801513671875, 6.99609375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 10.0, 13.0, 26.0, 24.0, 37.0, 63.0, 85.0, 135.0, 179.0, 286.0, 486.0, 647.0, 1012.0, 1501.0, 2201.0, 3396.0, 5180.0, 7823.0, 12285.0, 18631.0, 28664.0, 43884.0, 65643.0, 95401.0, 134552.0, 1119125.0, 207778.0, 112490.0, 79539.0, 53658.0, 35748.0, 22934.0, 15043.0, 9699.0, 6421.0, 4227.0, 2808.0, 1852.0, 1231.0, 778.0, 524.0, 342.0, 257.0, 167.0, 107.0, 65.0, 56.0, 40.0, 31.0, 18.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.50244140625, -0.4866180419921875, -0.470794677734375, -0.4549713134765625, -0.43914794921875, -0.4233245849609375, -0.407501220703125, -0.3916778564453125, -0.3758544921875, -0.3600311279296875, -0.344207763671875, -0.3283843994140625, -0.31256103515625, -0.2967376708984375, -0.280914306640625, -0.2650909423828125, -0.249267578125, -0.2334442138671875, -0.217620849609375, -0.2017974853515625, -0.18597412109375, -0.1701507568359375, -0.154327392578125, -0.1385040283203125, -0.1226806640625, -0.1068572998046875, -0.091033935546875, -0.0752105712890625, -0.05938720703125, -0.0435638427734375, -0.027740478515625, -0.0119171142578125, 0.00390625, 0.0197296142578125, 0.035552978515625, 0.0513763427734375, 0.06719970703125, 0.0830230712890625, 0.098846435546875, 0.1146697998046875, 0.1304931640625, 0.1463165283203125, 0.162139892578125, 0.1779632568359375, 0.19378662109375, 0.2096099853515625, 0.225433349609375, 0.2412567138671875, 0.257080078125, 0.2729034423828125, 0.288726806640625, 0.3045501708984375, 0.32037353515625, 0.3361968994140625, 0.352020263671875, 0.3678436279296875, 0.3836669921875, 0.3994903564453125, 0.415313720703125, 0.4311370849609375, 0.44696044921875, 0.4627838134765625, 0.478607177734375, 0.4944305419921875, 0.51025390625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 6.0, 6.0, 7.0, 9.0, 3.0, 7.0, 9.0, 13.0, 14.0, 11.0, 12.0, 20.0, 18.0, 26.0, 48.0, 77.0, 86.0, 126.0, 126.0, 98.0, 75.0, 37.0, 22.0, 24.0, 15.0, 13.0, 11.0, 10.0, 15.0, 10.0, 9.0, 4.0, 3.0, 5.0, 9.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281219482421875, -0.02724146842956543, -0.02636098861694336, -0.02548050880432129, -0.02460002899169922, -0.02371954917907715, -0.022839069366455078, -0.021958589553833008, -0.021078109741210938, -0.020197629928588867, -0.019317150115966797, -0.018436670303344727, -0.017556190490722656, -0.016675710678100586, -0.015795230865478516, -0.014914751052856445, -0.014034271240234375, -0.013153791427612305, -0.012273311614990234, -0.011392831802368164, -0.010512351989746094, -0.009631872177124023, -0.008751392364501953, -0.007870912551879883, -0.0069904327392578125, -0.006109952926635742, -0.005229473114013672, -0.0043489933013916016, -0.0034685134887695312, -0.002588033676147461, -0.0017075538635253906, -0.0008270740509033203, 5.340576171875e-05, 0.0009338855743408203, 0.0018143653869628906, 0.002694845199584961, 0.0035753250122070312, 0.0044558048248291016, 0.005336284637451172, 0.006216764450073242, 0.0070972442626953125, 0.007977724075317383, 0.008858203887939453, 0.009738683700561523, 0.010619163513183594, 0.011499643325805664, 0.012380123138427734, 0.013260602951049805, 0.014141082763671875, 0.015021562576293945, 0.015902042388916016, 0.016782522201538086, 0.017663002014160156, 0.018543481826782227, 0.019423961639404297, 0.020304441452026367, 0.021184921264648438, 0.022065401077270508, 0.022945880889892578, 0.02382636070251465, 0.02470684051513672, 0.02558732032775879, 0.02646780014038086, 0.02734827995300293, 0.028228759765625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 10.0, 4.0, 7.0, 7.0, 10.0, 15.0, 20.0, 21.0, 20.0, 30.0, 37.0, 48.0, 61.0, 143.0, 330.0, 1363.0, 522036.0, 522214.0, 1362.0, 337.0, 165.0, 62.0, 42.0, 39.0, 25.0, 20.0, 22.0, 24.0, 16.0, 10.0, 4.0, 12.0, 4.0, 12.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.583984375, -0.56573486328125, -0.5474853515625, -0.52923583984375, -0.510986328125, -0.49273681640625, -0.4744873046875, -0.45623779296875, -0.43798828125, -0.41973876953125, -0.4014892578125, -0.38323974609375, -0.364990234375, -0.34674072265625, -0.3284912109375, -0.31024169921875, -0.2919921875, -0.27374267578125, -0.2554931640625, -0.23724365234375, -0.218994140625, -0.20074462890625, -0.1824951171875, -0.16424560546875, -0.14599609375, -0.12774658203125, -0.1094970703125, -0.09124755859375, -0.072998046875, -0.05474853515625, -0.0364990234375, -0.01824951171875, 0.0, 0.01824951171875, 0.0364990234375, 0.05474853515625, 0.072998046875, 0.09124755859375, 0.1094970703125, 0.12774658203125, 0.14599609375, 0.16424560546875, 0.1824951171875, 0.20074462890625, 0.218994140625, 0.23724365234375, 0.2554931640625, 0.27374267578125, 0.2919921875, 0.31024169921875, 0.3284912109375, 0.34674072265625, 0.364990234375, 0.38323974609375, 0.4014892578125, 0.41973876953125, 0.43798828125, 0.45623779296875, 0.4744873046875, 0.49273681640625, 0.510986328125, 0.52923583984375, 0.5474853515625, 0.56573486328125, 0.583984375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 376.0, 638.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0387532003223896, -0.026014698669314384, -0.013276197016239166, -0.0005376972258090973, 0.01220080628991127, 0.024939309805631638, 0.03767780587077141, 0.050416309386491776, 0.06315481662750244, 0.07589332014322281, 0.08863182365894318, 0.10137031972408295, 0.11410882323980331, 0.12684732675552368, 0.13958582282066345, 0.15232431888580322, 0.1650628298521042, 0.17780132591724396, 0.19053983688354492, 0.2032783329486847, 0.21601682901382446, 0.22875533998012543, 0.2414938360452652, 0.25423234701156616, 0.26697084307670593, 0.2797093391418457, 0.2924478352069855, 0.30518633127212524, 0.3179248571395874, 0.3306633532047272, 0.34340184926986694, 0.3561403453350067, 0.3688788414001465, 0.38161733746528625, 0.394355833530426, 0.4070943593978882, 0.41983285546302795, 0.4325713515281677, 0.4453098475933075, 0.45804834365844727, 0.4707868695259094, 0.4835253655910492, 0.49626386165618896, 0.5090023875236511, 0.5217408537864685, 0.5344793796539307, 0.547217845916748, 0.5599563717842102, 0.5726948976516724, 0.5854334235191345, 0.5981718897819519, 0.6109104156494141, 0.6236488819122314, 0.6363874077796936, 0.6491259336471558, 0.6618643999099731, 0.6746028661727905, 0.6873413920402527, 0.7000798583030701, 0.7128183841705322, 0.7255568504333496, 0.7382953763008118, 0.7510339021682739, 0.7637723684310913, 0.7765108942985535]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 16.0, 27.0, 28.0, 36.0, 53.0, 54.0, 79.0, 68.0, 78.0, 81.0, 99.0, 86.0, 75.0, 64.0, 50.0, 34.0, 23.0, 23.0, 13.0, 4.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037107884883880615, -0.03602931648492813, -0.03495074436068535, -0.033872172236442566, -0.03279360383749008, -0.0317150354385376, -0.030636463314294815, -0.02955789305269718, -0.02847932279109955, -0.027400752529501915, -0.02632218226790428, -0.025243612006306648, -0.024165041744709015, -0.02308647148311138, -0.022007901221513748, -0.020929330959916115, -0.01985076069831848, -0.018772190436720848, -0.017693620175123215, -0.01661504991352558, -0.015536479651927948, -0.014457909390330315, -0.013379339128732681, -0.012300768867135048, -0.011222198605537415, -0.010143628343939781, -0.009065058082342148, -0.007986487820744514, -0.006907917559146881, -0.005829347297549248, -0.004750777035951614, -0.003672206774353981, -0.0025936365127563477, -0.0015150662511587143, -0.00043649598956108093, 0.0006420742720365524, 0.0017206445336341858, 0.002799214795231819, 0.0038777850568294525, 0.004956355318427086, 0.006034925580024719, 0.007113495841622353, 0.008192066103219986, 0.00927063636481762, 0.010349206626415253, 0.011427776888012886, 0.01250634714961052, 0.013584917411208153, 0.014663487672805786, 0.01574205793440342, 0.016820628196001053, 0.017899198457598686, 0.01897776871919632, 0.020056338980793953, 0.021134909242391586, 0.02221347950398922, 0.023292049765586853, 0.024370620027184486, 0.02544919028878212, 0.026527760550379753, 0.027606330811977386, 0.02868490107357502, 0.029763471335172653, 0.030842041596770287, 0.03192061185836792]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 2.0, 9.0, 4.0, 10.0, 14.0, 10.0, 12.0, 13.0, 15.0, 19.0, 23.0, 24.0, 22.0, 23.0, 27.0, 31.0, 33.0, 35.0, 41.0, 31.0, 35.0, 37.0, 32.0, 32.0, 22.0, 47.0, 45.0, 34.0, 21.0, 35.0, 24.0, 31.0, 31.0, 21.0, 22.0, 30.0, 12.0, 10.0, 19.0, 16.0, 8.0, 12.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.8984375, -8.6199951171875, -8.341552734375, -8.0631103515625, -7.78466796875, -7.5062255859375, -7.227783203125, -6.9493408203125, -6.6708984375, -6.3924560546875, -6.114013671875, -5.8355712890625, -5.55712890625, -5.2786865234375, -5.000244140625, -4.7218017578125, -4.443359375, -4.1649169921875, -3.886474609375, -3.6080322265625, -3.32958984375, -3.0511474609375, -2.772705078125, -2.4942626953125, -2.2158203125, -1.9373779296875, -1.658935546875, -1.3804931640625, -1.10205078125, -0.8236083984375, -0.545166015625, -0.2667236328125, 0.01171875, 0.2901611328125, 0.568603515625, 0.8470458984375, 1.12548828125, 1.4039306640625, 1.682373046875, 1.9608154296875, 2.2392578125, 2.5177001953125, 2.796142578125, 3.0745849609375, 3.35302734375, 3.6314697265625, 3.909912109375, 4.1883544921875, 4.466796875, 4.7452392578125, 5.023681640625, 5.3021240234375, 5.58056640625, 5.8590087890625, 6.137451171875, 6.4158935546875, 6.6943359375, 6.9727783203125, 7.251220703125, 7.5296630859375, 7.80810546875, 8.0865478515625, 8.364990234375, 8.6434326171875, 8.921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 8.0, 8.0, 11.0, 19.0, 18.0, 25.0, 46.0, 59.0, 71.0, 120.0, 155.0, 204.0, 307.0, 493.0, 702.0, 1054.0, 1609.0, 2615.0, 4276.0, 7369.0, 12633.0, 23499.0, 49477.0, 122754.0, 309119.0, 293311.0, 117159.0, 47653.0, 23125.0, 12282.0, 6931.0, 4025.0, 2558.0, 1580.0, 1074.0, 693.0, 460.0, 323.0, 219.0, 148.0, 116.0, 81.0, 57.0, 37.0, 25.0, 15.0, 11.0, 6.0, 4.0, 9.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3515625, -7.12164306640625, -6.8917236328125, -6.66180419921875, -6.431884765625, -6.20196533203125, -5.9720458984375, -5.74212646484375, -5.51220703125, -5.28228759765625, -5.0523681640625, -4.82244873046875, -4.592529296875, -4.36260986328125, -4.1326904296875, -3.90277099609375, -3.6728515625, -3.44293212890625, -3.2130126953125, -2.98309326171875, -2.753173828125, -2.52325439453125, -2.2933349609375, -2.06341552734375, -1.83349609375, -1.60357666015625, -1.3736572265625, -1.14373779296875, -0.913818359375, -0.68389892578125, -0.4539794921875, -0.22406005859375, 0.005859375, 0.23577880859375, 0.4656982421875, 0.69561767578125, 0.925537109375, 1.15545654296875, 1.3853759765625, 1.61529541015625, 1.84521484375, 2.07513427734375, 2.3050537109375, 2.53497314453125, 2.764892578125, 2.99481201171875, 3.2247314453125, 3.45465087890625, 3.6845703125, 3.91448974609375, 4.1444091796875, 4.37432861328125, 4.604248046875, 4.83416748046875, 5.0640869140625, 5.29400634765625, 5.52392578125, 5.75384521484375, 5.9837646484375, 6.21368408203125, 6.443603515625, 6.67352294921875, 6.9034423828125, 7.13336181640625, 7.36328125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 13.0, 14.0, 20.0, 14.0, 19.0, 26.0, 29.0, 37.0, 39.0, 59.0, 42.0, 64.0, 88.0, 301.0, 1640.0, 131.0, 74.0, 56.0, 49.0, 48.0, 41.0, 30.0, 35.0, 24.0, 19.0, 18.0, 14.0, 19.0, 15.0, 9.0, 7.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-40.0625, -38.8583984375, -37.654296875, -36.4501953125, -35.24609375, -34.0419921875, -32.837890625, -31.6337890625, -30.4296875, -29.2255859375, -28.021484375, -26.8173828125, -25.61328125, -24.4091796875, -23.205078125, -22.0009765625, -20.796875, -19.5927734375, -18.388671875, -17.1845703125, -15.98046875, -14.7763671875, -13.572265625, -12.3681640625, -11.1640625, -9.9599609375, -8.755859375, -7.5517578125, -6.34765625, -5.1435546875, -3.939453125, -2.7353515625, -1.53125, -0.3271484375, 0.876953125, 2.0810546875, 3.28515625, 4.4892578125, 5.693359375, 6.8974609375, 8.1015625, 9.3056640625, 10.509765625, 11.7138671875, 12.91796875, 14.1220703125, 15.326171875, 16.5302734375, 17.734375, 18.9384765625, 20.142578125, 21.3466796875, 22.55078125, 23.7548828125, 24.958984375, 26.1630859375, 27.3671875, 28.5712890625, 29.775390625, 30.9794921875, 32.18359375, 33.3876953125, 34.591796875, 35.7958984375, 37.0]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 10.0, 6.0, 14.0, 26.0, 23.0, 24.0, 24.0, 32.0, 50.0, 63.0, 108.0, 132.0, 162.0, 216.0, 341.0, 943.0, 10122.0, 3028891.0, 101140.0, 1921.0, 476.0, 265.0, 187.0, 131.0, 88.0, 70.0, 51.0, 32.0, 34.0, 20.0, 29.0, 20.0, 17.0, 8.0, 7.0, 6.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.875, -85.0146484375, -82.154296875, -79.2939453125, -76.43359375, -73.5732421875, -70.712890625, -67.8525390625, -64.9921875, -62.1318359375, -59.271484375, -56.4111328125, -53.55078125, -50.6904296875, -47.830078125, -44.9697265625, -42.109375, -39.2490234375, -36.388671875, -33.5283203125, -30.66796875, -27.8076171875, -24.947265625, -22.0869140625, -19.2265625, -16.3662109375, -13.505859375, -10.6455078125, -7.78515625, -4.9248046875, -2.064453125, 0.7958984375, 3.65625, 6.5166015625, 9.376953125, 12.2373046875, 15.09765625, 17.9580078125, 20.818359375, 23.6787109375, 26.5390625, 29.3994140625, 32.259765625, 35.1201171875, 37.98046875, 40.8408203125, 43.701171875, 46.5615234375, 49.421875, 52.2822265625, 55.142578125, 58.0029296875, 60.86328125, 63.7236328125, 66.583984375, 69.4443359375, 72.3046875, 75.1650390625, 78.025390625, 80.8857421875, 83.74609375, 86.6064453125, 89.466796875, 92.3271484375, 95.1875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [17.0, 405.0, 564.0, 32.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.939311981201172, -9.50727653503418, -1.0752410888671875, 7.356794357299805, 15.788829803466797, 24.220867156982422, 32.65290069580078, 41.08493423461914, 49.516971588134766, 57.949005126953125, 66.38104248046875, 74.81307983398438, 83.2451171875, 91.67715454101562, 100.10918426513672, 108.54121398925781, 116.97325134277344, 125.40528869628906, 133.8373260498047, 142.2693634033203, 150.70138549804688, 159.1334228515625, 167.56546020507812, 175.99749755859375, 184.42953491210938, 192.861572265625, 201.29360961914062, 209.72564697265625, 218.15768432617188, 226.5897216796875, 235.02174377441406, 243.4537811279297, 251.88580322265625, 260.3178405761719, 268.7498779296875, 277.1819152832031, 285.61395263671875, 294.0459899902344, 302.47802734375, 310.9100341796875, 319.34210205078125, 327.7741394042969, 336.2061767578125, 344.6382141113281, 353.07025146484375, 361.5022888183594, 369.934326171875, 378.3663330078125, 386.7983703613281, 395.23040771484375, 403.6624450683594, 412.094482421875, 420.5265197753906, 428.95855712890625, 437.3905944824219, 445.8226318359375, 454.254638671875, 462.6866760253906, 471.11871337890625, 479.5507507324219, 487.9827880859375, 496.4148254394531, 504.84686279296875, 513.2788696289062, 521.7109375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 12.0, 12.0, 13.0, 11.0, 13.0, 13.0, 19.0, 16.0, 26.0, 35.0, 32.0, 31.0, 38.0, 44.0, 46.0, 33.0, 39.0, 50.0, 46.0, 35.0, 56.0, 36.0, 39.0, 40.0, 34.0, 29.0, 27.0, 24.0, 19.0, 28.0, 23.0, 17.0, 14.0, 9.0, 13.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.13233184814453, -87.25057220458984, -84.36881256103516, -81.48704528808594, -78.60528564453125, -75.72352600097656, -72.84176635742188, -69.96000671386719, -67.0782470703125, -64.19648742675781, -61.31472396850586, -58.43296432495117, -55.55120086669922, -52.66944122314453, -49.787681579589844, -46.905921936035156, -44.02415466308594, -41.14239501953125, -38.2606315612793, -35.37887191772461, -32.497108459472656, -29.61534881591797, -26.73358917236328, -23.85182762145996, -20.97006607055664, -18.08830451965332, -15.206543922424316, -12.324783325195312, -9.443021774291992, -6.561260223388672, -3.6795005798339844, -0.7977390289306641, 2.0840225219726562, 4.965783596038818, 7.8475446701049805, 10.729305267333984, 13.611066818237305, 16.492828369140625, 19.374588012695312, 22.256349563598633, 25.138111114501953, 28.019872665405273, 30.901634216308594, 33.78339385986328, 36.66515350341797, 39.54691696166992, 42.42867660522461, 45.31044006347656, 48.19219970703125, 51.07395935058594, 53.95572280883789, 56.83748245239258, 59.71924591064453, 62.60100555419922, 65.4827651977539, 68.3645248413086, 71.24629211425781, 74.1280517578125, 77.00981140136719, 79.89157104492188, 82.7733383178711, 85.65509796142578, 88.53685760498047, 91.41861724853516, 94.30037689208984]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 9.0, 15.0, 13.0, 9.0, 21.0, 13.0, 22.0, 33.0, 25.0, 32.0, 30.0, 20.0, 37.0, 39.0, 37.0, 39.0, 44.0, 37.0, 31.0, 42.0, 43.0, 28.0, 32.0, 33.0, 34.0, 29.0, 32.0, 33.0, 32.0, 20.0, 17.0, 11.0, 18.0, 17.0, 17.0, 7.0, 5.0, 6.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-10.0546875, -9.741943359375, -9.42919921875, -9.116455078125, -8.8037109375, -8.490966796875, -8.17822265625, -7.865478515625, -7.552734375, -7.239990234375, -6.92724609375, -6.614501953125, -6.3017578125, -5.989013671875, -5.67626953125, -5.363525390625, -5.05078125, -4.738037109375, -4.42529296875, -4.112548828125, -3.7998046875, -3.487060546875, -3.17431640625, -2.861572265625, -2.548828125, -2.236083984375, -1.92333984375, -1.610595703125, -1.2978515625, -0.985107421875, -0.67236328125, -0.359619140625, -0.046875, 0.265869140625, 0.57861328125, 0.891357421875, 1.2041015625, 1.516845703125, 1.82958984375, 2.142333984375, 2.455078125, 2.767822265625, 3.08056640625, 3.393310546875, 3.7060546875, 4.018798828125, 4.33154296875, 4.644287109375, 4.95703125, 5.269775390625, 5.58251953125, 5.895263671875, 6.2080078125, 6.520751953125, 6.83349609375, 7.146240234375, 7.458984375, 7.771728515625, 8.08447265625, 8.397216796875, 8.7099609375, 9.022705078125, 9.33544921875, 9.648193359375, 9.9609375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 1.0, 3.0, 6.0, 6.0, 9.0, 8.0, 9.0, 11.0, 16.0, 27.0, 27.0, 23.0, 37.0, 40.0, 43.0, 52.0, 98.0, 167.0, 388.0, 1062.0, 4135.0, 24780.0, 336664.0, 2843384.0, 919550.0, 53387.0, 7240.0, 1727.0, 632.0, 240.0, 117.0, 79.0, 63.0, 51.0, 38.0, 22.0, 24.0, 28.0, 12.0, 11.0, 14.0, 8.0, 9.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.25, -26.361572265625, -25.47314453125, -24.584716796875, -23.6962890625, -22.807861328125, -21.91943359375, -21.031005859375, -20.142578125, -19.254150390625, -18.36572265625, -17.477294921875, -16.5888671875, -15.700439453125, -14.81201171875, -13.923583984375, -13.03515625, -12.146728515625, -11.25830078125, -10.369873046875, -9.4814453125, -8.593017578125, -7.70458984375, -6.816162109375, -5.927734375, -5.039306640625, -4.15087890625, -3.262451171875, -2.3740234375, -1.485595703125, -0.59716796875, 0.291259765625, 1.1796875, 2.068115234375, 2.95654296875, 3.844970703125, 4.7333984375, 5.621826171875, 6.51025390625, 7.398681640625, 8.287109375, 9.175537109375, 10.06396484375, 10.952392578125, 11.8408203125, 12.729248046875, 13.61767578125, 14.506103515625, 15.39453125, 16.282958984375, 17.17138671875, 18.059814453125, 18.9482421875, 19.836669921875, 20.72509765625, 21.613525390625, 22.501953125, 23.390380859375, 24.27880859375, 25.167236328125, 26.0556640625, 26.944091796875, 27.83251953125, 28.720947265625, 29.609375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 6.0, 13.0, 25.0, 34.0, 66.0, 89.0, 108.0, 188.0, 260.0, 425.0, 594.0, 580.0, 526.0, 364.0, 226.0, 184.0, 120.0, 77.0, 51.0, 41.0, 27.0, 22.0, 12.0, 6.0, 13.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.4208984375, -27.638671875, -26.8564453125, -26.07421875, -25.2919921875, -24.509765625, -23.7275390625, -22.9453125, -22.1630859375, -21.380859375, -20.5986328125, -19.81640625, -19.0341796875, -18.251953125, -17.4697265625, -16.6875, -15.9052734375, -15.123046875, -14.3408203125, -13.55859375, -12.7763671875, -11.994140625, -11.2119140625, -10.4296875, -9.6474609375, -8.865234375, -8.0830078125, -7.30078125, -6.5185546875, -5.736328125, -4.9541015625, -4.171875, -3.3896484375, -2.607421875, -1.8251953125, -1.04296875, -0.2607421875, 0.521484375, 1.3037109375, 2.0859375, 2.8681640625, 3.650390625, 4.4326171875, 5.21484375, 5.9970703125, 6.779296875, 7.5615234375, 8.34375, 9.1259765625, 9.908203125, 10.6904296875, 11.47265625, 12.2548828125, 13.037109375, 13.8193359375, 14.6015625, 15.3837890625, 16.166015625, 16.9482421875, 17.73046875, 18.5126953125, 19.294921875, 20.0771484375, 20.859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 10.0, 12.0, 24.0, 29.0, 35.0, 47.0, 60.0, 83.0, 126.0, 207.0, 269.0, 463.0, 1130.0, 12744.0, 2952443.0, 1217224.0, 7190.0, 973.0, 409.0, 245.0, 167.0, 129.0, 87.0, 61.0, 38.0, 17.0, 19.0, 10.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.125, -70.3037109375, -67.482421875, -64.6611328125, -61.83984375, -59.0185546875, -56.197265625, -53.3759765625, -50.5546875, -47.7333984375, -44.912109375, -42.0908203125, -39.26953125, -36.4482421875, -33.626953125, -30.8056640625, -27.984375, -25.1630859375, -22.341796875, -19.5205078125, -16.69921875, -13.8779296875, -11.056640625, -8.2353515625, -5.4140625, -2.5927734375, 0.228515625, 3.0498046875, 5.87109375, 8.6923828125, 11.513671875, 14.3349609375, 17.15625, 19.9775390625, 22.798828125, 25.6201171875, 28.44140625, 31.2626953125, 34.083984375, 36.9052734375, 39.7265625, 42.5478515625, 45.369140625, 48.1904296875, 51.01171875, 53.8330078125, 56.654296875, 59.4755859375, 62.296875, 65.1181640625, 67.939453125, 70.7607421875, 73.58203125, 76.4033203125, 79.224609375, 82.0458984375, 84.8671875, 87.6884765625, 90.509765625, 93.3310546875, 96.15234375, 98.9736328125, 101.794921875, 104.6162109375, 107.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 17.0, 51.0, 91.0, 161.0, 213.0, 173.0, 132.0, 97.0, 46.0, 17.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.01551055908203, -73.3468017578125, -68.67809295654297, -64.00938415527344, -59.34068298339844, -54.671974182128906, -50.003265380859375, -45.33456039428711, -40.66585159301758, -35.99714279174805, -31.32843780517578, -26.65972900390625, -21.99102210998535, -17.322315216064453, -12.653606414794922, -7.984901428222656, -3.316192626953125, 1.3525147438049316, 6.021222114562988, 10.689929962158203, 15.358636856079102, 20.02734375, 24.69605255126953, 29.364757537841797, 34.03346633911133, 38.70217514038086, 43.370880126953125, 48.039588928222656, 52.70829772949219, 57.37700271606445, 62.045711517333984, 66.71441650390625, 71.38311767578125, 76.05182647705078, 80.72053527832031, 85.38923645019531, 90.05794525146484, 94.72665405273438, 99.3953628540039, 104.06407165527344, 108.73277282714844, 113.40148162841797, 118.0701904296875, 122.7388916015625, 127.40760040283203, 132.07630920410156, 136.74502563476562, 141.41372680664062, 146.08242797851562, 150.75112915039062, 155.4198455810547, 160.0885467529297, 164.75726318359375, 169.42596435546875, 174.09466552734375, 178.7633819580078, 183.43209838867188, 188.10079956054688, 192.76951599121094, 197.43821716308594, 202.10693359375, 206.775634765625, 211.4443359375, 216.11305236816406, 220.78175354003906]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 10.0, 8.0, 6.0, 5.0, 10.0, 17.0, 15.0, 23.0, 18.0, 14.0, 22.0, 20.0, 24.0, 23.0, 31.0, 28.0, 33.0, 43.0, 33.0, 37.0, 42.0, 46.0, 34.0, 39.0, 34.0, 34.0, 46.0, 31.0, 29.0, 25.0, 25.0, 22.0, 25.0, 20.0, 15.0, 13.0, 16.0, 12.0, 11.0, 12.0, 10.0, 8.0, 6.0, 4.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 3.0, 3.0], "bins": [-59.52677917480469, -57.77389907836914, -56.021018981933594, -54.26813507080078, -52.515254974365234, -50.76237487792969, -49.00949478149414, -47.256614685058594, -45.50373077392578, -43.750850677490234, -41.99797058105469, -40.245086669921875, -38.49220657348633, -36.73932647705078, -34.986446380615234, -33.23356628417969, -31.48068618774414, -29.727806091308594, -27.974924087524414, -26.222043991088867, -24.469161987304688, -22.71628189086914, -20.963401794433594, -19.210521697998047, -17.457639694213867, -15.704758644104004, -13.95187759399414, -12.198997497558594, -10.44611644744873, -8.693235397338867, -6.94035530090332, -5.187474250793457, -3.4345932006835938, -1.6817123889923096, 0.07116842269897461, 1.8240489959716797, 3.576930046081543, 5.329811096191406, 7.082691192626953, 8.835572242736816, 10.58845329284668, 12.341334342956543, 14.094215393066406, 15.847095489501953, 17.5999755859375, 19.35285758972168, 21.105737686157227, 22.858619689941406, 24.611499786376953, 26.3643798828125, 28.11726188659668, 29.870141983032227, 31.623023986816406, 33.37590408325195, 35.1287841796875, 36.88166427612305, 38.634544372558594, 40.38742446899414, 42.14030456542969, 43.8931884765625, 45.64606857299805, 47.398948669433594, 49.15182876586914, 50.90470886230469, 52.6575927734375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 2.0, 3.0, 6.0, 1.0, 11.0, 5.0, 3.0, 7.0, 17.0, 13.0, 19.0, 18.0, 22.0, 18.0, 32.0, 18.0, 25.0, 37.0, 26.0, 41.0, 37.0, 36.0, 34.0, 48.0, 51.0, 39.0, 34.0, 32.0, 36.0, 37.0, 40.0, 39.0, 33.0, 23.0, 20.0, 20.0, 21.0, 15.0, 12.0, 14.0, 6.0, 6.0, 5.0, 7.0, 11.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.2265625, -9.92724609375, -9.6279296875, -9.32861328125, -9.029296875, -8.72998046875, -8.4306640625, -8.13134765625, -7.83203125, -7.53271484375, -7.2333984375, -6.93408203125, -6.634765625, -6.33544921875, -6.0361328125, -5.73681640625, -5.4375, -5.13818359375, -4.8388671875, -4.53955078125, -4.240234375, -3.94091796875, -3.6416015625, -3.34228515625, -3.04296875, -2.74365234375, -2.4443359375, -2.14501953125, -1.845703125, -1.54638671875, -1.2470703125, -0.94775390625, -0.6484375, -0.34912109375, -0.0498046875, 0.24951171875, 0.548828125, 0.84814453125, 1.1474609375, 1.44677734375, 1.74609375, 2.04541015625, 2.3447265625, 2.64404296875, 2.943359375, 3.24267578125, 3.5419921875, 3.84130859375, 4.140625, 4.43994140625, 4.7392578125, 5.03857421875, 5.337890625, 5.63720703125, 5.9365234375, 6.23583984375, 6.53515625, 6.83447265625, 7.1337890625, 7.43310546875, 7.732421875, 8.03173828125, 8.3310546875, 8.63037109375, 8.9296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 9.0, 9.0, 28.0, 25.0, 39.0, 51.0, 94.0, 132.0, 191.0, 307.0, 453.0, 605.0, 908.0, 1362.0, 2038.0, 2965.0, 4665.0, 6832.0, 10098.0, 15352.0, 23033.0, 35487.0, 54227.0, 82471.0, 120331.0, 156877.0, 158810.0, 122880.0, 84688.0, 56088.0, 36368.0, 23768.0, 15763.0, 10506.0, 6834.0, 4777.0, 3131.0, 2015.0, 1423.0, 926.0, 614.0, 429.0, 310.0, 196.0, 132.0, 119.0, 51.0, 38.0, 33.0, 20.0, 19.0, 14.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.72265625, -0.7000961303710938, -0.6775360107421875, -0.6549758911132812, -0.632415771484375, -0.6098556518554688, -0.5872955322265625, -0.5647354125976562, -0.54217529296875, -0.5196151733398438, -0.4970550537109375, -0.47449493408203125, -0.451934814453125, -0.42937469482421875, -0.4068145751953125, -0.38425445556640625, -0.3616943359375, -0.33913421630859375, -0.3165740966796875, -0.29401397705078125, -0.271453857421875, -0.24889373779296875, -0.2263336181640625, -0.20377349853515625, -0.18121337890625, -0.15865325927734375, -0.1360931396484375, -0.11353302001953125, -0.090972900390625, -0.06841278076171875, -0.0458526611328125, -0.02329254150390625, -0.000732421875, 0.02182769775390625, 0.0443878173828125, 0.06694793701171875, 0.089508056640625, 0.11206817626953125, 0.1346282958984375, 0.15718841552734375, 0.17974853515625, 0.20230865478515625, 0.2248687744140625, 0.24742889404296875, 0.269989013671875, 0.29254913330078125, 0.3151092529296875, 0.33766937255859375, 0.3602294921875, 0.38278961181640625, 0.4053497314453125, 0.42790985107421875, 0.450469970703125, 0.47303009033203125, 0.4955902099609375, 0.5181503295898438, 0.54071044921875, 0.5632705688476562, 0.5858306884765625, 0.6083908081054688, 0.630950927734375, 0.6535110473632812, 0.6760711669921875, 0.6986312866210938, 0.72119140625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 9.0, 5.0, 14.0, 4.0, 20.0, 17.0, 17.0, 20.0, 28.0, 19.0, 35.0, 30.0, 34.0, 45.0, 30.0, 34.0, 47.0, 38.0, 39.0, 1069.0, 39.0, 34.0, 30.0, 46.0, 36.0, 31.0, 34.0, 37.0, 28.0, 18.0, 19.0, 19.0, 26.0, 11.0, 16.0, 8.0, 7.0, 3.0, 9.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9921875, -5.78045654296875, -5.5687255859375, -5.35699462890625, -5.145263671875, -4.93353271484375, -4.7218017578125, -4.51007080078125, -4.29833984375, -4.08660888671875, -3.8748779296875, -3.66314697265625, -3.451416015625, -3.23968505859375, -3.0279541015625, -2.81622314453125, -2.6044921875, -2.39276123046875, -2.1810302734375, -1.96929931640625, -1.757568359375, -1.54583740234375, -1.3341064453125, -1.12237548828125, -0.91064453125, -0.69891357421875, -0.4871826171875, -0.27545166015625, -0.063720703125, 0.14801025390625, 0.3597412109375, 0.57147216796875, 0.783203125, 0.99493408203125, 1.2066650390625, 1.41839599609375, 1.630126953125, 1.84185791015625, 2.0535888671875, 2.26531982421875, 2.47705078125, 2.68878173828125, 2.9005126953125, 3.11224365234375, 3.323974609375, 3.53570556640625, 3.7474365234375, 3.95916748046875, 4.1708984375, 4.38262939453125, 4.5943603515625, 4.80609130859375, 5.017822265625, 5.22955322265625, 5.4412841796875, 5.65301513671875, 5.86474609375, 6.07647705078125, 6.2882080078125, 6.49993896484375, 6.711669921875, 6.92340087890625, 7.1351318359375, 7.34686279296875, 7.55859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 11.0, 16.0, 27.0, 37.0, 63.0, 107.0, 150.0, 244.0, 324.0, 594.0, 965.0, 1431.0, 2250.0, 3797.0, 6044.0, 9651.0, 15491.0, 25599.0, 42095.0, 66162.0, 100664.0, 145478.0, 1158324.0, 192850.0, 115920.0, 77638.0, 50158.0, 31040.0, 18987.0, 11714.0, 7248.0, 4583.0, 2763.0, 1739.0, 1123.0, 661.0, 379.0, 260.0, 190.0, 142.0, 71.0, 49.0, 36.0, 21.0, 12.0, 13.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.60107421875, -0.5826873779296875, -0.564300537109375, -0.5459136962890625, -0.52752685546875, -0.5091400146484375, -0.490753173828125, -0.4723663330078125, -0.4539794921875, -0.4355926513671875, -0.417205810546875, -0.3988189697265625, -0.38043212890625, -0.3620452880859375, -0.343658447265625, -0.3252716064453125, -0.306884765625, -0.2884979248046875, -0.270111083984375, -0.2517242431640625, -0.23333740234375, -0.2149505615234375, -0.196563720703125, -0.1781768798828125, -0.1597900390625, -0.1414031982421875, -0.123016357421875, -0.1046295166015625, -0.08624267578125, -0.0678558349609375, -0.049468994140625, -0.0310821533203125, -0.0126953125, 0.0056915283203125, 0.024078369140625, 0.0424652099609375, 0.06085205078125, 0.0792388916015625, 0.097625732421875, 0.1160125732421875, 0.1343994140625, 0.1527862548828125, 0.171173095703125, 0.1895599365234375, 0.20794677734375, 0.2263336181640625, 0.244720458984375, 0.2631072998046875, 0.281494140625, 0.2998809814453125, 0.318267822265625, 0.3366546630859375, 0.35504150390625, 0.3734283447265625, 0.391815185546875, 0.4102020263671875, 0.4285888671875, 0.4469757080078125, 0.465362548828125, 0.4837493896484375, 0.50213623046875, 0.5205230712890625, 0.538909912109375, 0.5572967529296875, 0.57568359375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 8.0, 11.0, 10.0, 9.0, 15.0, 17.0, 27.0, 40.0, 39.0, 47.0, 71.0, 104.0, 99.0, 88.0, 74.0, 75.0, 44.0, 33.0, 30.0, 27.0, 16.0, 18.0, 11.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0266265869140625, -0.02572035789489746, -0.024814128875732422, -0.023907899856567383, -0.023001670837402344, -0.022095441818237305, -0.021189212799072266, -0.020282983779907227, -0.019376754760742188, -0.01847052574157715, -0.01756429672241211, -0.01665806770324707, -0.01575183868408203, -0.014845609664916992, -0.013939380645751953, -0.013033151626586914, -0.012126922607421875, -0.011220693588256836, -0.010314464569091797, -0.009408235549926758, -0.008502006530761719, -0.00759577751159668, -0.006689548492431641, -0.0057833194732666016, -0.0048770904541015625, -0.0039708614349365234, -0.0030646324157714844, -0.0021584033966064453, -0.0012521743774414062, -0.0003459453582763672, 0.0005602836608886719, 0.001466512680053711, 0.00237274169921875, 0.003278970718383789, 0.004185199737548828, 0.005091428756713867, 0.005997657775878906, 0.006903886795043945, 0.007810115814208984, 0.008716344833374023, 0.009622573852539062, 0.010528802871704102, 0.01143503189086914, 0.01234126091003418, 0.013247489929199219, 0.014153718948364258, 0.015059947967529297, 0.015966176986694336, 0.016872406005859375, 0.017778635025024414, 0.018684864044189453, 0.019591093063354492, 0.02049732208251953, 0.02140355110168457, 0.02230978012084961, 0.02321600914001465, 0.024122238159179688, 0.025028467178344727, 0.025934696197509766, 0.026840925216674805, 0.027747154235839844, 0.028653383255004883, 0.029559612274169922, 0.03046584129333496, 0.0313720703125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 6.0, 7.0, 4.0, 11.0, 10.0, 17.0, 17.0, 17.0, 28.0, 39.0, 46.0, 99.0, 117.0, 199.0, 336.0, 1174.0, 417350.0, 626916.0, 1214.0, 383.0, 163.0, 95.0, 62.0, 51.0, 33.0, 28.0, 17.0, 8.0, 25.0, 12.0, 9.0, 8.0, 4.0, 7.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.634765625, -0.61663818359375, -0.5985107421875, -0.58038330078125, -0.562255859375, -0.54412841796875, -0.5260009765625, -0.50787353515625, -0.48974609375, -0.47161865234375, -0.4534912109375, -0.43536376953125, -0.417236328125, -0.39910888671875, -0.3809814453125, -0.36285400390625, -0.3447265625, -0.32659912109375, -0.3084716796875, -0.29034423828125, -0.272216796875, -0.25408935546875, -0.2359619140625, -0.21783447265625, -0.19970703125, -0.18157958984375, -0.1634521484375, -0.14532470703125, -0.127197265625, -0.10906982421875, -0.0909423828125, -0.07281494140625, -0.0546875, -0.03656005859375, -0.0184326171875, -0.00030517578125, 0.017822265625, 0.03594970703125, 0.0540771484375, 0.07220458984375, 0.09033203125, 0.10845947265625, 0.1265869140625, 0.14471435546875, 0.162841796875, 0.18096923828125, 0.1990966796875, 0.21722412109375, 0.2353515625, 0.25347900390625, 0.2716064453125, 0.28973388671875, 0.307861328125, 0.32598876953125, 0.3441162109375, 0.36224365234375, 0.38037109375, 0.39849853515625, 0.4166259765625, 0.43475341796875, 0.452880859375, 0.47100830078125, 0.4891357421875, 0.50726318359375, 0.525390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 970.0, 46.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037553515285253525, -0.02384784072637558, -0.010142166167497635, 0.00356350839138031, 0.017269182950258255, 0.0309748537838459, 0.044680532068014145, 0.05838621035218239, 0.07209187746047974, 0.08579754829406738, 0.09950322657823563, 0.11320890486240387, 0.12691457569599152, 0.14062024652957916, 0.154325932264328, 0.16803160309791565, 0.1817372739315033, 0.19544294476509094, 0.2091486155986786, 0.22285430133342743, 0.23655997216701508, 0.2502656579017639, 0.26397132873535156, 0.2776769995689392, 0.29138267040252686, 0.3050883412361145, 0.31879401206970215, 0.3324996829032898, 0.34620535373687744, 0.3599110245704651, 0.3736167252063751, 0.38732239603996277, 0.4010280966758728, 0.41473376750946045, 0.4284394383430481, 0.44214510917663574, 0.4558507800102234, 0.46955645084381104, 0.48326215147972107, 0.4969678223133087, 0.5106735229492188, 0.5243791937828064, 0.538084864616394, 0.5517905354499817, 0.5654962062835693, 0.579201877117157, 0.5929075479507446, 0.606613278388977, 0.6203188896179199, 0.6340245604515076, 0.6477302312850952, 0.6614359021186829, 0.6751415729522705, 0.6888472437858582, 0.7025529146194458, 0.7162586450576782, 0.7299642562866211, 0.7436699271202087, 0.7573755979537964, 0.771081268787384, 0.7847869396209717, 0.7984926104545593, 0.812198281288147, 0.8259040117263794, 0.839609682559967]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 15.0, 23.0, 21.0, 44.0, 38.0, 55.0, 66.0, 72.0, 94.0, 87.0, 78.0, 66.0, 73.0, 76.0, 46.0, 45.0, 22.0, 27.0, 26.0, 11.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03854191303253174, -0.0375216007232666, -0.036501288414001465, -0.03548097237944603, -0.03446066007018089, -0.033440347760915756, -0.03242003172636032, -0.031399719417095184, -0.030379407107830048, -0.02935909479856491, -0.028338780626654625, -0.02731846645474434, -0.026298154145479202, -0.025277841836214066, -0.02425752766430378, -0.023237213492393494, -0.022216901183128357, -0.02119658887386322, -0.020176274701952934, -0.01915596053004265, -0.01813564822077751, -0.017115335911512375, -0.01609502173960209, -0.015074708499014378, -0.014054395258426666, -0.013034082017838955, -0.012013768777251244, -0.010993455536663532, -0.009973142296075821, -0.00895282905548811, -0.007932515814900398, -0.006912202574312687, -0.005891889333724976, -0.004871576093137264, -0.003851262852549553, -0.0028309496119618416, -0.0018106363713741302, -0.0007903231307864189, 0.00022999010980129242, 0.0012503033503890038, 0.002270616590976715, 0.0032909298315644264, 0.004311243072152138, 0.005331556312739849, 0.00635186955332756, 0.007372182793915272, 0.008392496034502983, 0.009412809275090694, 0.010433122515678406, 0.011453435756266117, 0.012473748996853828, 0.01349406223744154, 0.014514375478029251, 0.015534688718616962, 0.016555001959204674, 0.01757531613111496, 0.018595628440380096, 0.019615940749645233, 0.02063625492155552, 0.021656569093465805, 0.022676881402730942, 0.02369719371199608, 0.024717507883906364, 0.02573782205581665, 0.026758134365081787]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 3.0, 2.0, 3.0, 6.0, 1.0, 11.0, 5.0, 3.0, 7.0, 17.0, 13.0, 19.0, 18.0, 22.0, 18.0, 32.0, 18.0, 25.0, 37.0, 26.0, 42.0, 36.0, 36.0, 33.0, 49.0, 51.0, 39.0, 34.0, 32.0, 36.0, 37.0, 40.0, 38.0, 34.0, 23.0, 20.0, 20.0, 21.0, 15.0, 12.0, 14.0, 6.0, 6.0, 5.0, 7.0, 11.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.2265625, -9.92724609375, -9.6279296875, -9.32861328125, -9.029296875, -8.72998046875, -8.4306640625, -8.13134765625, -7.83203125, -7.53271484375, -7.2333984375, -6.93408203125, -6.634765625, -6.33544921875, -6.0361328125, -5.73681640625, -5.4375, -5.13818359375, -4.8388671875, -4.53955078125, -4.240234375, -3.94091796875, -3.6416015625, -3.34228515625, -3.04296875, -2.74365234375, -2.4443359375, -2.14501953125, -1.845703125, -1.54638671875, -1.2470703125, -0.94775390625, -0.6484375, -0.34912109375, -0.0498046875, 0.24951171875, 0.548828125, 0.84814453125, 1.1474609375, 1.44677734375, 1.74609375, 2.04541015625, 2.3447265625, 2.64404296875, 2.943359375, 3.24267578125, 3.5419921875, 3.84130859375, 4.140625, 4.43994140625, 4.7392578125, 5.03857421875, 5.337890625, 5.63720703125, 5.9365234375, 6.23583984375, 6.53515625, 6.83447265625, 7.1337890625, 7.43310546875, 7.732421875, 8.03173828125, 8.3310546875, 8.63037109375, 8.9296875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 13.0, 10.0, 8.0, 9.0, 8.0, 26.0, 18.0, 30.0, 36.0, 29.0, 65.0, 70.0, 122.0, 163.0, 221.0, 326.0, 516.0, 948.0, 1714.0, 3020.0, 6001.0, 12297.0, 25261.0, 56314.0, 141862.0, 403124.0, 238474.0, 85509.0, 36660.0, 17436.0, 8478.0, 4194.0, 2223.0, 1245.0, 715.0, 419.0, 283.0, 173.0, 144.0, 91.0, 65.0, 53.0, 39.0, 37.0, 27.0, 16.0, 16.0, 12.0, 10.0, 6.0, 11.0, 1.0, 3.0, 4.0, 0.0, 3.0], "bins": [-9.1640625, -8.8924560546875, -8.620849609375, -8.3492431640625, -8.07763671875, -7.8060302734375, -7.534423828125, -7.2628173828125, -6.9912109375, -6.7196044921875, -6.447998046875, -6.1763916015625, -5.90478515625, -5.6331787109375, -5.361572265625, -5.0899658203125, -4.818359375, -4.5467529296875, -4.275146484375, -4.0035400390625, -3.73193359375, -3.4603271484375, -3.188720703125, -2.9171142578125, -2.6455078125, -2.3739013671875, -2.102294921875, -1.8306884765625, -1.55908203125, -1.2874755859375, -1.015869140625, -0.7442626953125, -0.47265625, -0.2010498046875, 0.070556640625, 0.3421630859375, 0.61376953125, 0.8853759765625, 1.156982421875, 1.4285888671875, 1.7001953125, 1.9718017578125, 2.243408203125, 2.5150146484375, 2.78662109375, 3.0582275390625, 3.329833984375, 3.6014404296875, 3.873046875, 4.1446533203125, 4.416259765625, 4.6878662109375, 4.95947265625, 5.2310791015625, 5.502685546875, 5.7742919921875, 6.0458984375, 6.3175048828125, 6.589111328125, 6.8607177734375, 7.13232421875, 7.4039306640625, 7.675537109375, 7.9471435546875, 8.21875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 13.0, 9.0, 18.0, 13.0, 20.0, 35.0, 32.0, 40.0, 40.0, 64.0, 49.0, 63.0, 121.0, 1678.0, 357.0, 92.0, 74.0, 61.0, 51.0, 34.0, 32.0, 25.0, 24.0, 25.0, 21.0, 12.0, 13.0, 7.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78125, -36.3193359375, -34.857421875, -33.3955078125, -31.93359375, -30.4716796875, -29.009765625, -27.5478515625, -26.0859375, -24.6240234375, -23.162109375, -21.7001953125, -20.23828125, -18.7763671875, -17.314453125, -15.8525390625, -14.390625, -12.9287109375, -11.466796875, -10.0048828125, -8.54296875, -7.0810546875, -5.619140625, -4.1572265625, -2.6953125, -1.2333984375, 0.228515625, 1.6904296875, 3.15234375, 4.6142578125, 6.076171875, 7.5380859375, 9.0, 10.4619140625, 11.923828125, 13.3857421875, 14.84765625, 16.3095703125, 17.771484375, 19.2333984375, 20.6953125, 22.1572265625, 23.619140625, 25.0810546875, 26.54296875, 28.0048828125, 29.466796875, 30.9287109375, 32.390625, 33.8525390625, 35.314453125, 36.7763671875, 38.23828125, 39.7001953125, 41.162109375, 42.6240234375, 44.0859375, 45.5478515625, 47.009765625, 48.4716796875, 49.93359375, 51.3955078125, 52.857421875, 54.3193359375, 55.78125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 4.0, 9.0, 24.0, 41.0, 34.0, 57.0, 60.0, 82.0, 145.0, 198.0, 408.0, 1014.0, 10383.0, 3102942.0, 27782.0, 1247.0, 472.0, 237.0, 167.0, 107.0, 80.0, 50.0, 33.0, 36.0, 26.0, 13.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-120.125, -116.5498046875, -112.974609375, -109.3994140625, -105.82421875, -102.2490234375, -98.673828125, -95.0986328125, -91.5234375, -87.9482421875, -84.373046875, -80.7978515625, -77.22265625, -73.6474609375, -70.072265625, -66.4970703125, -62.921875, -59.3466796875, -55.771484375, -52.1962890625, -48.62109375, -45.0458984375, -41.470703125, -37.8955078125, -34.3203125, -30.7451171875, -27.169921875, -23.5947265625, -20.01953125, -16.4443359375, -12.869140625, -9.2939453125, -5.71875, -2.1435546875, 1.431640625, 5.0068359375, 8.58203125, 12.1572265625, 15.732421875, 19.3076171875, 22.8828125, 26.4580078125, 30.033203125, 33.6083984375, 37.18359375, 40.7587890625, 44.333984375, 47.9091796875, 51.484375, 55.0595703125, 58.634765625, 62.2099609375, 65.78515625, 69.3603515625, 72.935546875, 76.5107421875, 80.0859375, 83.6611328125, 87.236328125, 90.8115234375, 94.38671875, 97.9619140625, 101.537109375, 105.1123046875, 108.6875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 32.0, 177.0, 382.0, 335.0, 81.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-224.1649627685547, -219.47555541992188, -214.7861328125, -210.0967254638672, -205.4073028564453, -200.7178955078125, -196.02847290039062, -191.3390655517578, -186.649658203125, -181.9602508544922, -177.2708282470703, -172.5814208984375, -167.89199829101562, -163.2025909423828, -158.51316833496094, -153.82376098632812, -149.13433837890625, -144.44493103027344, -139.75550842285156, -135.06610107421875, -130.37667846679688, -125.68727111816406, -120.99785614013672, -116.30844116210938, -111.61902618408203, -106.92961120605469, -102.24019622802734, -97.55078125, -92.86137390136719, -88.17195129394531, -83.4825439453125, -78.79312896728516, -74.10370635986328, -69.41429138183594, -64.7248764038086, -60.035465240478516, -55.34605026245117, -50.65663528442383, -45.96722412109375, -41.277809143066406, -36.58839416503906, -31.89897918701172, -27.209566116333008, -22.520153045654297, -17.830738067626953, -13.14132308959961, -8.451910018920898, -3.7624969482421875, 0.9269180297851562, 5.616332054138184, 10.305746078491211, 14.995160102844238, 19.684574127197266, 24.37398910522461, 29.06340217590332, 33.75281524658203, 38.442230224609375, 43.13164520263672, 47.82106018066406, 52.51047134399414, 57.199886322021484, 61.88930130004883, 66.5787124633789, 71.26812744140625, 75.9575424194336]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 5.0, 4.0, 2.0, 9.0, 8.0, 11.0, 10.0, 11.0, 15.0, 19.0, 28.0, 17.0, 27.0, 29.0, 27.0, 26.0, 29.0, 37.0, 35.0, 43.0, 52.0, 38.0, 39.0, 38.0, 40.0, 42.0, 34.0, 37.0, 28.0, 25.0, 23.0, 34.0, 30.0, 31.0, 22.0, 19.0, 11.0, 10.0, 8.0, 10.0, 9.0, 7.0, 7.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-85.33950805664062, -82.64139556884766, -79.94328308105469, -77.24516296386719, -74.54705047607422, -71.84893798828125, -69.15081787109375, -66.45270538330078, -63.75459289550781, -61.056480407714844, -58.35836410522461, -55.660247802734375, -52.962135314941406, -50.26402282714844, -47.5659065246582, -44.86779022216797, -42.169677734375, -39.47156524658203, -36.7734489440918, -34.07533264160156, -31.377220153808594, -28.679105758666992, -25.98099136352539, -23.28287696838379, -20.584762573242188, -17.886648178100586, -15.188533782958984, -12.490419387817383, -9.792304992675781, -7.09419059753418, -4.396076202392578, -1.6979618072509766, 1.000152587890625, 3.6982669830322266, 6.396381378173828, 9.09449577331543, 11.792610168457031, 14.490724563598633, 17.188838958740234, 19.886953353881836, 22.585067749023438, 25.28318214416504, 27.98129653930664, 30.679410934448242, 33.377525329589844, 36.07563781738281, 38.77375411987305, 41.47187042236328, 44.16998291015625, 46.86809539794922, 49.56621170043945, 52.26432800292969, 54.962440490722656, 57.660552978515625, 60.35866928100586, 63.056785583496094, 65.75489807128906, 68.45301055908203, 71.151123046875, 73.8492431640625, 76.54735565185547, 79.24546813964844, 81.94358825683594, 84.6417007446289, 87.33981323242188]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 10.0, 18.0, 13.0, 24.0, 19.0, 22.0, 29.0, 21.0, 27.0, 39.0, 31.0, 35.0, 33.0, 48.0, 35.0, 34.0, 39.0, 47.0, 40.0, 27.0, 26.0, 44.0, 37.0, 30.0, 34.0, 35.0, 25.0, 14.0, 20.0, 21.0, 13.0, 9.0, 8.0, 7.0, 10.0, 6.0, 10.0, 2.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.140625, -9.8258056640625, -9.510986328125, -9.1961669921875, -8.88134765625, -8.5665283203125, -8.251708984375, -7.9368896484375, -7.6220703125, -7.3072509765625, -6.992431640625, -6.6776123046875, -6.36279296875, -6.0479736328125, -5.733154296875, -5.4183349609375, -5.103515625, -4.7886962890625, -4.473876953125, -4.1590576171875, -3.84423828125, -3.5294189453125, -3.214599609375, -2.8997802734375, -2.5849609375, -2.2701416015625, -1.955322265625, -1.6405029296875, -1.32568359375, -1.0108642578125, -0.696044921875, -0.3812255859375, -0.06640625, 0.2484130859375, 0.563232421875, 0.8780517578125, 1.19287109375, 1.5076904296875, 1.822509765625, 2.1373291015625, 2.4521484375, 2.7669677734375, 3.081787109375, 3.3966064453125, 3.71142578125, 4.0262451171875, 4.341064453125, 4.6558837890625, 4.970703125, 5.2855224609375, 5.600341796875, 5.9151611328125, 6.22998046875, 6.5447998046875, 6.859619140625, 7.1744384765625, 7.4892578125, 7.8040771484375, 8.118896484375, 8.4337158203125, 8.74853515625, 9.0633544921875, 9.378173828125, 9.6929931640625, 10.0078125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 2.0, 6.0, 6.0, 9.0, 10.0, 11.0, 13.0, 18.0, 27.0, 24.0, 34.0, 35.0, 50.0, 94.0, 123.0, 219.0, 471.0, 1151.0, 4150.0, 22884.0, 325074.0, 3072030.0, 719425.0, 39679.0, 5826.0, 1536.0, 579.0, 254.0, 148.0, 98.0, 62.0, 51.0, 28.0, 26.0, 22.0, 13.0, 18.0, 11.0, 12.0, 9.0, 8.0, 9.0, 1.0, 7.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-32.84375, -31.866943359375, -30.89013671875, -29.913330078125, -28.9365234375, -27.959716796875, -26.98291015625, -26.006103515625, -25.029296875, -24.052490234375, -23.07568359375, -22.098876953125, -21.1220703125, -20.145263671875, -19.16845703125, -18.191650390625, -17.21484375, -16.238037109375, -15.26123046875, -14.284423828125, -13.3076171875, -12.330810546875, -11.35400390625, -10.377197265625, -9.400390625, -8.423583984375, -7.44677734375, -6.469970703125, -5.4931640625, -4.516357421875, -3.53955078125, -2.562744140625, -1.5859375, -0.609130859375, 0.36767578125, 1.344482421875, 2.3212890625, 3.298095703125, 4.27490234375, 5.251708984375, 6.228515625, 7.205322265625, 8.18212890625, 9.158935546875, 10.1357421875, 11.112548828125, 12.08935546875, 13.066162109375, 14.04296875, 15.019775390625, 15.99658203125, 16.973388671875, 17.9501953125, 18.927001953125, 19.90380859375, 20.880615234375, 21.857421875, 22.834228515625, 23.81103515625, 24.787841796875, 25.7646484375, 26.741455078125, 27.71826171875, 28.695068359375, 29.671875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 9.0, 19.0, 25.0, 26.0, 48.0, 58.0, 58.0, 104.0, 145.0, 240.0, 341.0, 493.0, 583.0, 543.0, 425.0, 268.0, 202.0, 138.0, 115.0, 85.0, 40.0, 27.0, 21.0, 21.0, 9.0, 9.0, 8.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.765625, -28.060546875, -27.35546875, -26.650390625, -25.9453125, -25.240234375, -24.53515625, -23.830078125, -23.125, -22.419921875, -21.71484375, -21.009765625, -20.3046875, -19.599609375, -18.89453125, -18.189453125, -17.484375, -16.779296875, -16.07421875, -15.369140625, -14.6640625, -13.958984375, -13.25390625, -12.548828125, -11.84375, -11.138671875, -10.43359375, -9.728515625, -9.0234375, -8.318359375, -7.61328125, -6.908203125, -6.203125, -5.498046875, -4.79296875, -4.087890625, -3.3828125, -2.677734375, -1.97265625, -1.267578125, -0.5625, 0.142578125, 0.84765625, 1.552734375, 2.2578125, 2.962890625, 3.66796875, 4.373046875, 5.078125, 5.783203125, 6.48828125, 7.193359375, 7.8984375, 8.603515625, 9.30859375, 10.013671875, 10.71875, 11.423828125, 12.12890625, 12.833984375, 13.5390625, 14.244140625, 14.94921875, 15.654296875, 16.359375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 7.0, 14.0, 19.0, 24.0, 31.0, 50.0, 73.0, 108.0, 154.0, 205.0, 269.0, 506.0, 1551.0, 37557.0, 3937017.0, 211759.0, 3227.0, 610.0, 338.0, 235.0, 140.0, 103.0, 80.0, 53.0, 36.0, 26.0, 24.0, 28.0, 9.0, 9.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.625, -76.5224609375, -73.419921875, -70.3173828125, -67.21484375, -64.1123046875, -61.009765625, -57.9072265625, -54.8046875, -51.7021484375, -48.599609375, -45.4970703125, -42.39453125, -39.2919921875, -36.189453125, -33.0869140625, -29.984375, -26.8818359375, -23.779296875, -20.6767578125, -17.57421875, -14.4716796875, -11.369140625, -8.2666015625, -5.1640625, -2.0615234375, 1.041015625, 4.1435546875, 7.24609375, 10.3486328125, 13.451171875, 16.5537109375, 19.65625, 22.7587890625, 25.861328125, 28.9638671875, 32.06640625, 35.1689453125, 38.271484375, 41.3740234375, 44.4765625, 47.5791015625, 50.681640625, 53.7841796875, 56.88671875, 59.9892578125, 63.091796875, 66.1943359375, 69.296875, 72.3994140625, 75.501953125, 78.6044921875, 81.70703125, 84.8095703125, 87.912109375, 91.0146484375, 94.1171875, 97.2197265625, 100.322265625, 103.4248046875, 106.52734375, 109.6298828125, 112.732421875, 115.8349609375, 118.9375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 11.0, 17.0, 26.0, 54.0, 97.0, 135.0, 143.0, 164.0, 113.0, 94.0, 71.0, 31.0, 30.0, 16.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.62815856933594, -174.0123748779297, -170.39659118652344, -166.7808074951172, -163.16502380371094, -159.5492401123047, -155.93345642089844, -152.3176727294922, -148.70188903808594, -145.0861053466797, -141.47032165527344, -137.8545379638672, -134.23875427246094, -130.6229705810547, -127.00718688964844, -123.39140319824219, -119.77562713623047, -116.15984344482422, -112.54405975341797, -108.92827606201172, -105.31249237060547, -101.69670867919922, -98.0809326171875, -94.46514892578125, -90.849365234375, -87.23358154296875, -83.6177978515625, -80.00201416015625, -76.38623046875, -72.77044677734375, -69.1546630859375, -65.53887939453125, -61.923099517822266, -58.307315826416016, -54.691532135009766, -51.07575225830078, -47.45996856689453, -43.84418487548828, -40.22840118408203, -36.61261749267578, -32.99683380126953, -29.38105010986328, -25.76526641845703, -22.149484634399414, -18.533700942993164, -14.917917251586914, -11.302135467529297, -7.686351776123047, -4.070568084716797, -0.4547848701477051, 3.1609983444213867, 6.77678108215332, 10.39256477355957, 14.00834846496582, 17.624130249023438, 21.239913940429688, 24.855697631835938, 28.471481323242188, 32.08726501464844, 35.70304870605469, 39.31883239746094, 42.93461608886719, 46.55039596557617, 50.16617965698242, 53.78196334838867]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 8.0, 7.0, 11.0, 10.0, 16.0, 19.0, 21.0, 24.0, 30.0, 28.0, 31.0, 39.0, 36.0, 39.0, 38.0, 19.0, 45.0, 31.0, 35.0, 33.0, 37.0, 34.0, 46.0, 34.0, 28.0, 29.0, 32.0, 24.0, 22.0, 20.0, 22.0, 23.0, 15.0, 16.0, 12.0, 15.0, 7.0, 11.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-54.229827880859375, -52.40794372558594, -50.586063385009766, -48.76417922973633, -46.942298889160156, -45.12041473388672, -43.29853057861328, -41.476646423339844, -39.65476608276367, -37.832881927490234, -36.01100158691406, -34.189117431640625, -32.36723327636719, -30.545352935791016, -28.723468780517578, -26.901586532592773, -25.07970428466797, -23.257822036743164, -21.43593978881836, -19.614055633544922, -17.792173385620117, -15.970291137695312, -14.148407936096191, -12.32652473449707, -10.504642486572266, -8.682760238647461, -6.86087703704834, -5.038994312286377, -3.217111587524414, -1.3952293395996094, 0.4266538619995117, 2.248537063598633, 4.0704193115234375, 5.8923020362854, 7.714184761047363, 9.536067962646484, 11.357950210571289, 13.179832458496094, 15.001715660095215, 16.823598861694336, 18.64548110961914, 20.467363357543945, 22.28924560546875, 24.111129760742188, 25.933012008666992, 27.754894256591797, 29.576778411865234, 31.39866065979004, 33.220542907714844, 35.04242706298828, 36.86430740356445, 38.68619155883789, 40.50807189941406, 42.3299560546875, 44.15184020996094, 45.973724365234375, 47.79560470581055, 49.617488861083984, 51.439369201660156, 53.261253356933594, 55.08313751220703, 56.9050178527832, 58.72690200805664, 60.54878234863281, 62.37066650390625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 9.0, 9.0, 9.0, 16.0, 10.0, 11.0, 10.0, 16.0, 14.0, 19.0, 24.0, 24.0, 23.0, 33.0, 30.0, 31.0, 31.0, 32.0, 43.0, 48.0, 40.0, 28.0, 43.0, 33.0, 40.0, 39.0, 28.0, 26.0, 22.0, 25.0, 26.0, 33.0, 27.0, 17.0, 17.0, 14.0, 21.0, 16.0, 9.0, 10.0, 8.0, 10.0, 4.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0], "bins": [-10.4921875, -10.1881103515625, -9.884033203125, -9.5799560546875, -9.27587890625, -8.9718017578125, -8.667724609375, -8.3636474609375, -8.0595703125, -7.7554931640625, -7.451416015625, -7.1473388671875, -6.84326171875, -6.5391845703125, -6.235107421875, -5.9310302734375, -5.626953125, -5.3228759765625, -5.018798828125, -4.7147216796875, -4.41064453125, -4.1065673828125, -3.802490234375, -3.4984130859375, -3.1943359375, -2.8902587890625, -2.586181640625, -2.2821044921875, -1.97802734375, -1.6739501953125, -1.369873046875, -1.0657958984375, -0.76171875, -0.4576416015625, -0.153564453125, 0.1505126953125, 0.45458984375, 0.7586669921875, 1.062744140625, 1.3668212890625, 1.6708984375, 1.9749755859375, 2.279052734375, 2.5831298828125, 2.88720703125, 3.1912841796875, 3.495361328125, 3.7994384765625, 4.103515625, 4.4075927734375, 4.711669921875, 5.0157470703125, 5.31982421875, 5.6239013671875, 5.927978515625, 6.2320556640625, 6.5361328125, 6.8402099609375, 7.144287109375, 7.4483642578125, 7.75244140625, 8.0565185546875, 8.360595703125, 8.6646728515625, 8.96875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 15.0, 14.0, 26.0, 62.0, 83.0, 148.0, 207.0, 341.0, 525.0, 861.0, 1491.0, 2168.0, 3548.0, 5709.0, 9201.0, 14746.0, 23382.0, 38279.0, 61422.0, 98758.0, 149034.0, 185885.0, 160084.0, 109767.0, 69978.0, 42758.0, 26571.0, 16438.0, 10179.0, 6227.0, 3896.0, 2525.0, 1637.0, 979.0, 582.0, 401.0, 237.0, 144.0, 80.0, 53.0, 33.0, 27.0, 25.0, 12.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.95263671875, -0.9243011474609375, -0.895965576171875, -0.8676300048828125, -0.83929443359375, -0.8109588623046875, -0.782623291015625, -0.7542877197265625, -0.7259521484375, -0.6976165771484375, -0.669281005859375, -0.6409454345703125, -0.61260986328125, -0.5842742919921875, -0.555938720703125, -0.5276031494140625, -0.499267578125, -0.4709320068359375, -0.442596435546875, -0.4142608642578125, -0.38592529296875, -0.3575897216796875, -0.329254150390625, -0.3009185791015625, -0.2725830078125, -0.2442474365234375, -0.215911865234375, -0.1875762939453125, -0.15924072265625, -0.1309051513671875, -0.102569580078125, -0.0742340087890625, -0.0458984375, -0.0175628662109375, 0.010772705078125, 0.0391082763671875, 0.06744384765625, 0.0957794189453125, 0.124114990234375, 0.1524505615234375, 0.1807861328125, 0.2091217041015625, 0.237457275390625, 0.2657928466796875, 0.29412841796875, 0.3224639892578125, 0.350799560546875, 0.3791351318359375, 0.407470703125, 0.4358062744140625, 0.464141845703125, 0.4924774169921875, 0.52081298828125, 0.5491485595703125, 0.577484130859375, 0.6058197021484375, 0.6341552734375, 0.6624908447265625, 0.690826416015625, 0.7191619873046875, 0.74749755859375, 0.7758331298828125, 0.804168701171875, 0.8325042724609375, 0.86083984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 11.0, 19.0, 16.0, 29.0, 13.0, 29.0, 28.0, 30.0, 37.0, 38.0, 41.0, 53.0, 33.0, 37.0, 1066.0, 45.0, 50.0, 56.0, 35.0, 61.0, 39.0, 23.0, 35.0, 28.0, 21.0, 22.0, 20.0, 17.0, 8.0, 8.0, 9.0, 6.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65234375, -6.40899658203125, -6.1656494140625, -5.92230224609375, -5.678955078125, -5.43560791015625, -5.1922607421875, -4.94891357421875, -4.70556640625, -4.46221923828125, -4.2188720703125, -3.97552490234375, -3.732177734375, -3.48883056640625, -3.2454833984375, -3.00213623046875, -2.7587890625, -2.51544189453125, -2.2720947265625, -2.02874755859375, -1.785400390625, -1.54205322265625, -1.2987060546875, -1.05535888671875, -0.81201171875, -0.56866455078125, -0.3253173828125, -0.08197021484375, 0.161376953125, 0.40472412109375, 0.6480712890625, 0.89141845703125, 1.134765625, 1.37811279296875, 1.6214599609375, 1.86480712890625, 2.108154296875, 2.35150146484375, 2.5948486328125, 2.83819580078125, 3.08154296875, 3.32489013671875, 3.5682373046875, 3.81158447265625, 4.054931640625, 4.29827880859375, 4.5416259765625, 4.78497314453125, 5.0283203125, 5.27166748046875, 5.5150146484375, 5.75836181640625, 6.001708984375, 6.24505615234375, 6.4884033203125, 6.73175048828125, 6.97509765625, 7.21844482421875, 7.4617919921875, 7.70513916015625, 7.948486328125, 8.19183349609375, 8.4351806640625, 8.67852783203125, 8.921875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 8.0, 15.0, 23.0, 35.0, 44.0, 68.0, 101.0, 158.0, 282.0, 455.0, 688.0, 1146.0, 1753.0, 2910.0, 4662.0, 7631.0, 12935.0, 21366.0, 36009.0, 59050.0, 94407.0, 142707.0, 1069644.0, 304076.0, 126247.0, 81954.0, 51015.0, 30837.0, 18244.0, 10993.0, 6767.0, 4101.0, 2563.0, 1596.0, 972.0, 594.0, 364.0, 254.0, 153.0, 106.0, 57.0, 46.0, 27.0, 27.0, 10.0, 7.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.658203125, -0.6381683349609375, -0.618133544921875, -0.5980987548828125, -0.57806396484375, -0.5580291748046875, -0.537994384765625, -0.5179595947265625, -0.4979248046875, -0.4778900146484375, -0.457855224609375, -0.4378204345703125, -0.41778564453125, -0.3977508544921875, -0.377716064453125, -0.3576812744140625, -0.337646484375, -0.3176116943359375, -0.297576904296875, -0.2775421142578125, -0.25750732421875, -0.2374725341796875, -0.217437744140625, -0.1974029541015625, -0.1773681640625, -0.1573333740234375, -0.137298583984375, -0.1172637939453125, -0.09722900390625, -0.0771942138671875, -0.057159423828125, -0.0371246337890625, -0.01708984375, 0.0029449462890625, 0.022979736328125, 0.0430145263671875, 0.06304931640625, 0.0830841064453125, 0.103118896484375, 0.1231536865234375, 0.1431884765625, 0.1632232666015625, 0.183258056640625, 0.2032928466796875, 0.22332763671875, 0.2433624267578125, 0.263397216796875, 0.2834320068359375, 0.303466796875, 0.3235015869140625, 0.343536376953125, 0.3635711669921875, 0.38360595703125, 0.4036407470703125, 0.423675537109375, 0.4437103271484375, 0.4637451171875, 0.4837799072265625, 0.503814697265625, 0.5238494873046875, 0.54388427734375, 0.5639190673828125, 0.583953857421875, 0.6039886474609375, 0.6240234375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 9.0, 8.0, 13.0, 14.0, 15.0, 12.0, 21.0, 16.0, 17.0, 13.0, 19.0, 18.0, 22.0, 34.0, 64.0, 95.0, 113.0, 97.0, 104.0, 59.0, 36.0, 17.0, 28.0, 14.0, 21.0, 15.0, 11.0, 13.0, 11.0, 14.0, 11.0, 12.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036102294921875, -0.0350041389465332, -0.033905982971191406, -0.03280782699584961, -0.03170967102050781, -0.030611515045166016, -0.02951335906982422, -0.028415203094482422, -0.027317047119140625, -0.026218891143798828, -0.02512073516845703, -0.024022579193115234, -0.022924423217773438, -0.02182626724243164, -0.020728111267089844, -0.019629955291748047, -0.01853179931640625, -0.017433643341064453, -0.016335487365722656, -0.01523733139038086, -0.014139175415039062, -0.013041019439697266, -0.011942863464355469, -0.010844707489013672, -0.009746551513671875, -0.008648395538330078, -0.007550239562988281, -0.006452083587646484, -0.0053539276123046875, -0.004255771636962891, -0.0031576156616210938, -0.002059459686279297, -0.0009613037109375, 0.00013685226440429688, 0.0012350082397460938, 0.0023331642150878906, 0.0034313201904296875, 0.004529476165771484, 0.005627632141113281, 0.006725788116455078, 0.007823944091796875, 0.008922100067138672, 0.010020256042480469, 0.011118412017822266, 0.012216567993164062, 0.01331472396850586, 0.014412879943847656, 0.015511035919189453, 0.01660919189453125, 0.017707347869873047, 0.018805503845214844, 0.01990365982055664, 0.021001815795898438, 0.022099971771240234, 0.02319812774658203, 0.024296283721923828, 0.025394439697265625, 0.026492595672607422, 0.02759075164794922, 0.028688907623291016, 0.029787063598632812, 0.03088521957397461, 0.031983375549316406, 0.0330815315246582, 0.0341796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 8.0, 11.0, 16.0, 12.0, 17.0, 27.0, 27.0, 26.0, 28.0, 34.0, 53.0, 77.0, 122.0, 257.0, 506.0, 2630.0, 966184.0, 76551.0, 944.0, 381.0, 173.0, 87.0, 67.0, 52.0, 45.0, 31.0, 26.0, 25.0, 32.0, 15.0, 19.0, 17.0, 9.0, 4.0, 8.0, 9.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69384765625, -0.672027587890625, -0.65020751953125, -0.628387451171875, -0.6065673828125, -0.584747314453125, -0.56292724609375, -0.541107177734375, -0.519287109375, -0.497467041015625, -0.47564697265625, -0.453826904296875, -0.4320068359375, -0.410186767578125, -0.38836669921875, -0.366546630859375, -0.3447265625, -0.322906494140625, -0.30108642578125, -0.279266357421875, -0.2574462890625, -0.235626220703125, -0.21380615234375, -0.191986083984375, -0.170166015625, -0.148345947265625, -0.12652587890625, -0.104705810546875, -0.0828857421875, -0.061065673828125, -0.03924560546875, -0.017425537109375, 0.00439453125, 0.026214599609375, 0.04803466796875, 0.069854736328125, 0.0916748046875, 0.113494873046875, 0.13531494140625, 0.157135009765625, 0.178955078125, 0.200775146484375, 0.22259521484375, 0.244415283203125, 0.2662353515625, 0.288055419921875, 0.30987548828125, 0.331695556640625, 0.353515625, 0.375335693359375, 0.39715576171875, 0.418975830078125, 0.4407958984375, 0.462615966796875, 0.48443603515625, 0.506256103515625, 0.528076171875, 0.549896240234375, 0.57171630859375, 0.593536376953125, 0.6153564453125, 0.637176513671875, 0.65899658203125, 0.680816650390625, 0.70263671875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1001.0, 11.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06556237488985062, -0.046912312507629395, -0.028262246400117874, -0.009612180292606354, 0.009037882089614868, 0.02768794447183609, 0.04633801430463791, 0.06498806923627853, 0.08363813906908035, 0.10228820145130157, 0.1209382712841034, 0.13958832621574402, 0.15823839604854584, 0.17688846588134766, 0.19553852081298828, 0.2141885757446289, 0.23283866047859192, 0.25148871541023254, 0.27013880014419556, 0.2887888550758362, 0.3074389100074768, 0.32608896493911743, 0.34473904967308044, 0.36338910460472107, 0.3820391595363617, 0.4006892144680023, 0.41933929920196533, 0.43798935413360596, 0.4566394090652466, 0.4752894639968872, 0.4939395487308502, 0.5125895738601685, 0.5312396883964539, 0.5498897433280945, 0.5685397982597351, 0.5871899127960205, 0.6058399677276611, 0.6244900226593018, 0.6431400775909424, 0.661790132522583, 0.6804401874542236, 0.6990902423858643, 0.7177402973175049, 0.7363903522491455, 0.7550404667854309, 0.7736905217170715, 0.7923405766487122, 0.8109906315803528, 0.8296407461166382, 0.8482908010482788, 0.8669408559799194, 0.8855909109115601, 0.9042410254478455, 0.9228910803794861, 0.9415411353111267, 0.9601911902427673, 0.978841245174408, 0.9974913001060486, 1.016141414642334, 1.0347914695739746, 1.0534415245056152, 1.0720915794372559, 1.0907416343688965, 1.109391689300537, 1.1280417442321777]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 12.0, 17.0, 22.0, 37.0, 44.0, 54.0, 68.0, 82.0, 84.0, 107.0, 86.0, 87.0, 75.0, 53.0, 53.0, 32.0, 37.0, 20.0, 10.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05605518817901611, -0.054511141031980515, -0.052967093884944916, -0.051423050463199615, -0.04987900331616402, -0.04833495616912842, -0.04679091274738312, -0.04524686560034752, -0.04370281845331192, -0.04215877130627632, -0.04061472415924072, -0.03907068073749542, -0.037526633590459824, -0.035982586443424225, -0.034438543021678925, -0.032894495874643326, -0.03135044872760773, -0.02980640158057213, -0.02826235629618168, -0.02671831101179123, -0.02517426386475563, -0.023630216717720032, -0.022086171433329582, -0.020542126148939133, -0.018998079001903534, -0.017454031854867935, -0.015909986570477486, -0.014365940354764462, -0.012821894139051437, -0.011277847923338413, -0.009733801707625389, -0.008189755491912365, -0.006645709276199341, -0.005101663060486317, -0.0035576168447732925, -0.0020135706290602684, -0.00046952441334724426, 0.0010745218023657799, 0.002618568018078804, 0.004162614233791828, 0.005706660449504852, 0.0072507066652178764, 0.0087947528809309, 0.010338799096643925, 0.011882845312356949, 0.013426891528069973, 0.014970937743782997, 0.016514983028173447, 0.018059030175209045, 0.019603077322244644, 0.021147122606635094, 0.022691167891025543, 0.024235215038061142, 0.02577926218509674, 0.02732330746948719, 0.02886735275387764, 0.03041139990091324, 0.03195544704794884, 0.033499494194984436, 0.035043537616729736, 0.036587584763765335, 0.038131631910800934, 0.039675675332546234, 0.04121972247958183, 0.04276376962661743]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 8.0, 10.0, 9.0, 16.0, 10.0, 12.0, 9.0, 16.0, 14.0, 20.0, 23.0, 24.0, 23.0, 33.0, 30.0, 32.0, 30.0, 32.0, 43.0, 48.0, 40.0, 28.0, 43.0, 33.0, 40.0, 39.0, 28.0, 26.0, 22.0, 25.0, 25.0, 34.0, 27.0, 16.0, 18.0, 14.0, 21.0, 16.0, 9.0, 10.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 2.0], "bins": [-10.4921875, -10.1881103515625, -9.884033203125, -9.5799560546875, -9.27587890625, -8.9718017578125, -8.667724609375, -8.3636474609375, -8.0595703125, -7.7554931640625, -7.451416015625, -7.1473388671875, -6.84326171875, -6.5391845703125, -6.235107421875, -5.9310302734375, -5.626953125, -5.3228759765625, -5.018798828125, -4.7147216796875, -4.41064453125, -4.1065673828125, -3.802490234375, -3.4984130859375, -3.1943359375, -2.8902587890625, -2.586181640625, -2.2821044921875, -1.97802734375, -1.6739501953125, -1.369873046875, -1.0657958984375, -0.76171875, -0.4576416015625, -0.153564453125, 0.1505126953125, 0.45458984375, 0.7586669921875, 1.062744140625, 1.3668212890625, 1.6708984375, 1.9749755859375, 2.279052734375, 2.5831298828125, 2.88720703125, 3.1912841796875, 3.495361328125, 3.7994384765625, 4.103515625, 4.4075927734375, 4.711669921875, 5.0157470703125, 5.31982421875, 5.6239013671875, 5.927978515625, 6.2320556640625, 6.5361328125, 6.8402099609375, 7.144287109375, 7.4483642578125, 7.75244140625, 8.0565185546875, 8.360595703125, 8.6646728515625, 8.96875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 8.0, 13.0, 7.0, 12.0, 19.0, 16.0, 21.0, 25.0, 35.0, 51.0, 63.0, 99.0, 140.0, 176.0, 318.0, 537.0, 988.0, 1815.0, 3848.0, 9291.0, 29635.0, 121383.0, 663482.0, 160336.0, 36017.0, 11202.0, 4312.0, 1950.0, 1033.0, 597.0, 359.0, 208.0, 141.0, 102.0, 71.0, 55.0, 47.0, 35.0, 21.0, 17.0, 12.0, 14.0, 18.0, 5.0, 6.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 1.0], "bins": [-18.546875, -18.010498046875, -17.47412109375, -16.937744140625, -16.4013671875, -15.864990234375, -15.32861328125, -14.792236328125, -14.255859375, -13.719482421875, -13.18310546875, -12.646728515625, -12.1103515625, -11.573974609375, -11.03759765625, -10.501220703125, -9.96484375, -9.428466796875, -8.89208984375, -8.355712890625, -7.8193359375, -7.282958984375, -6.74658203125, -6.210205078125, -5.673828125, -5.137451171875, -4.60107421875, -4.064697265625, -3.5283203125, -2.991943359375, -2.45556640625, -1.919189453125, -1.3828125, -0.846435546875, -0.31005859375, 0.226318359375, 0.7626953125, 1.299072265625, 1.83544921875, 2.371826171875, 2.908203125, 3.444580078125, 3.98095703125, 4.517333984375, 5.0537109375, 5.590087890625, 6.12646484375, 6.662841796875, 7.19921875, 7.735595703125, 8.27197265625, 8.808349609375, 9.3447265625, 9.881103515625, 10.41748046875, 10.953857421875, 11.490234375, 12.026611328125, 12.56298828125, 13.099365234375, 13.6357421875, 14.172119140625, 14.70849609375, 15.244873046875, 15.78125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 6.0, 12.0, 11.0, 7.0, 15.0, 22.0, 31.0, 20.0, 29.0, 33.0, 37.0, 33.0, 43.0, 50.0, 64.0, 122.0, 1729.0, 252.0, 81.0, 57.0, 44.0, 49.0, 45.0, 46.0, 28.0, 32.0, 26.0, 16.0, 23.0, 17.0, 11.0, 8.0, 9.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.84375, -33.6318359375, -32.419921875, -31.2080078125, -29.99609375, -28.7841796875, -27.572265625, -26.3603515625, -25.1484375, -23.9365234375, -22.724609375, -21.5126953125, -20.30078125, -19.0888671875, -17.876953125, -16.6650390625, -15.453125, -14.2412109375, -13.029296875, -11.8173828125, -10.60546875, -9.3935546875, -8.181640625, -6.9697265625, -5.7578125, -4.5458984375, -3.333984375, -2.1220703125, -0.91015625, 0.3017578125, 1.513671875, 2.7255859375, 3.9375, 5.1494140625, 6.361328125, 7.5732421875, 8.78515625, 9.9970703125, 11.208984375, 12.4208984375, 13.6328125, 14.8447265625, 16.056640625, 17.2685546875, 18.48046875, 19.6923828125, 20.904296875, 22.1162109375, 23.328125, 24.5400390625, 25.751953125, 26.9638671875, 28.17578125, 29.3876953125, 30.599609375, 31.8115234375, 33.0234375, 34.2353515625, 35.447265625, 36.6591796875, 37.87109375, 39.0830078125, 40.294921875, 41.5068359375, 42.71875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 9.0, 3.0, 10.0, 7.0, 12.0, 10.0, 28.0, 20.0, 20.0, 37.0, 45.0, 54.0, 58.0, 102.0, 131.0, 229.0, 724.0, 4418.0, 1112331.0, 2021371.0, 4603.0, 730.0, 250.0, 113.0, 76.0, 70.0, 50.0, 32.0, 28.0, 24.0, 30.0, 15.0, 13.0, 6.0, 8.0, 7.0, 5.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-123.5625, -120.033203125, -116.50390625, -112.974609375, -109.4453125, -105.916015625, -102.38671875, -98.857421875, -95.328125, -91.798828125, -88.26953125, -84.740234375, -81.2109375, -77.681640625, -74.15234375, -70.623046875, -67.09375, -63.564453125, -60.03515625, -56.505859375, -52.9765625, -49.447265625, -45.91796875, -42.388671875, -38.859375, -35.330078125, -31.80078125, -28.271484375, -24.7421875, -21.212890625, -17.68359375, -14.154296875, -10.625, -7.095703125, -3.56640625, -0.037109375, 3.4921875, 7.021484375, 10.55078125, 14.080078125, 17.609375, 21.138671875, 24.66796875, 28.197265625, 31.7265625, 35.255859375, 38.78515625, 42.314453125, 45.84375, 49.373046875, 52.90234375, 56.431640625, 59.9609375, 63.490234375, 67.01953125, 70.548828125, 74.078125, 77.607421875, 81.13671875, 84.666015625, 88.1953125, 91.724609375, 95.25390625, 98.783203125, 102.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [6.0, 24.0, 206.0, 567.0, 194.0, 20.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.761428833007812, -16.316307067871094, -9.871187210083008, -3.426067352294922, 3.019054412841797, 9.464176177978516, 15.909294128417969, 22.354415893554688, 28.799537658691406, 35.244659423828125, 41.689781188964844, 48.1348991394043, 54.580020904541016, 61.025142669677734, 67.47026062011719, 73.9153823852539, 80.36050415039062, 86.80562591552734, 93.25074768066406, 99.69586181640625, 106.1409912109375, 112.58610534667969, 119.0312271118164, 125.47634887695312, 131.92147827148438, 138.36659240722656, 144.8117218017578, 151.2568359375, 157.70196533203125, 164.14707946777344, 170.59219360351562, 177.03732299804688, 183.48245239257812, 189.9275665283203, 196.37269592285156, 202.81781005859375, 209.262939453125, 215.7080535888672, 222.15316772460938, 228.59829711914062, 235.04342651367188, 241.48854064941406, 247.9336700439453, 254.3787841796875, 260.82391357421875, 267.26904296875, 273.7141418457031, 280.1592712402344, 286.6043701171875, 293.04949951171875, 299.4945983886719, 305.9397277832031, 312.3848571777344, 318.8299865722656, 325.27508544921875, 331.72021484375, 338.16534423828125, 344.6104736328125, 351.0555725097656, 357.5007019042969, 363.9458312988281, 370.3909606933594, 376.8360595703125, 383.28118896484375, 389.726318359375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 3.0, 5.0, 5.0, 11.0, 12.0, 13.0, 15.0, 26.0, 17.0, 22.0, 32.0, 31.0, 36.0, 40.0, 44.0, 48.0, 41.0, 43.0, 47.0, 41.0, 38.0, 38.0, 44.0, 50.0, 38.0, 22.0, 27.0, 30.0, 32.0, 22.0, 23.0, 23.0, 14.0, 13.0, 11.0, 9.0, 11.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.2823486328125, -109.82086181640625, -106.359375, -102.89788818359375, -99.4364013671875, -95.97491455078125, -92.513427734375, -89.05194091796875, -85.5904541015625, -82.12896728515625, -78.66748046875, -75.20599365234375, -71.7445068359375, -68.28302001953125, -64.821533203125, -61.360042572021484, -57.89855194091797, -54.43706512451172, -50.97557830810547, -47.51409149169922, -44.05260467529297, -40.59111785888672, -37.1296272277832, -33.66814041137695, -30.206653594970703, -26.745166778564453, -23.283679962158203, -19.82219123840332, -16.36070442199707, -12.89921760559082, -9.437728881835938, -5.9762420654296875, -2.5147628784179688, 0.9467244148254395, 4.408211708068848, 7.869699478149414, 11.331186294555664, 14.792673110961914, 18.254161834716797, 21.715648651123047, 25.177135467529297, 28.638622283935547, 32.1001091003418, 35.56159973144531, 39.02308654785156, 42.48457336425781, 45.94606018066406, 49.40754699707031, 52.86903381347656, 56.33052062988281, 59.79200744628906, 63.25349426269531, 66.71498107910156, 70.17646789550781, 73.63795471191406, 77.09944152832031, 80.56092834472656, 84.02241516113281, 87.48390197753906, 90.94538879394531, 94.40687561035156, 97.86836242675781, 101.32984924316406, 104.79133605957031, 108.2528305053711]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 8.0, 5.0, 15.0, 11.0, 10.0, 11.0, 15.0, 22.0, 17.0, 24.0, 28.0, 29.0, 21.0, 24.0, 34.0, 37.0, 34.0, 26.0, 43.0, 33.0, 39.0, 39.0, 43.0, 32.0, 37.0, 35.0, 38.0, 20.0, 28.0, 21.0, 15.0, 28.0, 22.0, 16.0, 26.0, 17.0, 12.0, 12.0, 9.0, 6.0, 8.0, 6.0, 4.0, 6.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-10.7890625, -10.4666748046875, -10.144287109375, -9.8218994140625, -9.49951171875, -9.1771240234375, -8.854736328125, -8.5323486328125, -8.2099609375, -7.8875732421875, -7.565185546875, -7.2427978515625, -6.92041015625, -6.5980224609375, -6.275634765625, -5.9532470703125, -5.630859375, -5.3084716796875, -4.986083984375, -4.6636962890625, -4.34130859375, -4.0189208984375, -3.696533203125, -3.3741455078125, -3.0517578125, -2.7293701171875, -2.406982421875, -2.0845947265625, -1.76220703125, -1.4398193359375, -1.117431640625, -0.7950439453125, -0.47265625, -0.1502685546875, 0.172119140625, 0.4945068359375, 0.81689453125, 1.1392822265625, 1.461669921875, 1.7840576171875, 2.1064453125, 2.4288330078125, 2.751220703125, 3.0736083984375, 3.39599609375, 3.7183837890625, 4.040771484375, 4.3631591796875, 4.685546875, 5.0079345703125, 5.330322265625, 5.6527099609375, 5.97509765625, 6.2974853515625, 6.619873046875, 6.9422607421875, 7.2646484375, 7.5870361328125, 7.909423828125, 8.2318115234375, 8.55419921875, 8.8765869140625, 9.198974609375, 9.5213623046875, 9.84375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 16.0, 14.0, 17.0, 20.0, 31.0, 41.0, 52.0, 61.0, 111.0, 142.0, 225.0, 344.0, 613.0, 1017.0, 1889.0, 3692.0, 7855.0, 18585.0, 54549.0, 198061.0, 691037.0, 1473925.0, 1156428.0, 415178.0, 112195.0, 33789.0, 12705.0, 5335.0, 2668.0, 1403.0, 850.0, 488.0, 304.0, 169.0, 110.0, 93.0, 74.0, 50.0, 34.0, 22.0, 27.0, 10.0, 13.0, 10.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.6875, -13.2568359375, -12.826171875, -12.3955078125, -11.96484375, -11.5341796875, -11.103515625, -10.6728515625, -10.2421875, -9.8115234375, -9.380859375, -8.9501953125, -8.51953125, -8.0888671875, -7.658203125, -7.2275390625, -6.796875, -6.3662109375, -5.935546875, -5.5048828125, -5.07421875, -4.6435546875, -4.212890625, -3.7822265625, -3.3515625, -2.9208984375, -2.490234375, -2.0595703125, -1.62890625, -1.1982421875, -0.767578125, -0.3369140625, 0.09375, 0.5244140625, 0.955078125, 1.3857421875, 1.81640625, 2.2470703125, 2.677734375, 3.1083984375, 3.5390625, 3.9697265625, 4.400390625, 4.8310546875, 5.26171875, 5.6923828125, 6.123046875, 6.5537109375, 6.984375, 7.4150390625, 7.845703125, 8.2763671875, 8.70703125, 9.1376953125, 9.568359375, 9.9990234375, 10.4296875, 10.8603515625, 11.291015625, 11.7216796875, 12.15234375, 12.5830078125, 13.013671875, 13.4443359375, 13.875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 7.0, 5.0, 4.0, 11.0, 10.0, 26.0, 25.0, 55.0, 63.0, 93.0, 115.0, 195.0, 286.0, 391.0, 529.0, 543.0, 483.0, 362.0, 282.0, 179.0, 144.0, 82.0, 62.0, 27.0, 33.0, 22.0, 13.0, 6.0, 4.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.307373046875, -21.52099609375, -20.734619140625, -19.9482421875, -19.161865234375, -18.37548828125, -17.589111328125, -16.802734375, -16.016357421875, -15.22998046875, -14.443603515625, -13.6572265625, -12.870849609375, -12.08447265625, -11.298095703125, -10.51171875, -9.725341796875, -8.93896484375, -8.152587890625, -7.3662109375, -6.579833984375, -5.79345703125, -5.007080078125, -4.220703125, -3.434326171875, -2.64794921875, -1.861572265625, -1.0751953125, -0.288818359375, 0.49755859375, 1.283935546875, 2.0703125, 2.856689453125, 3.64306640625, 4.429443359375, 5.2158203125, 6.002197265625, 6.78857421875, 7.574951171875, 8.361328125, 9.147705078125, 9.93408203125, 10.720458984375, 11.5068359375, 12.293212890625, 13.07958984375, 13.865966796875, 14.65234375, 15.438720703125, 16.22509765625, 17.011474609375, 17.7978515625, 18.584228515625, 19.37060546875, 20.156982421875, 20.943359375, 21.729736328125, 22.51611328125, 23.302490234375, 24.0888671875, 24.875244140625, 25.66162109375, 26.447998046875, 27.234375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 12.0, 11.0, 15.0, 20.0, 31.0, 41.0, 59.0, 94.0, 147.0, 226.0, 366.0, 726.0, 2537.0, 52496.0, 3884136.0, 246231.0, 4943.0, 969.0, 439.0, 269.0, 174.0, 97.0, 85.0, 55.0, 38.0, 23.0, 14.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.1875, -91.388671875, -88.58984375, -85.791015625, -82.9921875, -80.193359375, -77.39453125, -74.595703125, -71.796875, -68.998046875, -66.19921875, -63.400390625, -60.6015625, -57.802734375, -55.00390625, -52.205078125, -49.40625, -46.607421875, -43.80859375, -41.009765625, -38.2109375, -35.412109375, -32.61328125, -29.814453125, -27.015625, -24.216796875, -21.41796875, -18.619140625, -15.8203125, -13.021484375, -10.22265625, -7.423828125, -4.625, -1.826171875, 0.97265625, 3.771484375, 6.5703125, 9.369140625, 12.16796875, 14.966796875, 17.765625, 20.564453125, 23.36328125, 26.162109375, 28.9609375, 31.759765625, 34.55859375, 37.357421875, 40.15625, 42.955078125, 45.75390625, 48.552734375, 51.3515625, 54.150390625, 56.94921875, 59.748046875, 62.546875, 65.345703125, 68.14453125, 70.943359375, 73.7421875, 76.541015625, 79.33984375, 82.138671875, 84.9375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 32.0, 103.0, 200.0, 301.0, 221.0, 115.0, 30.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.31478881835938, -187.926513671875, -180.5382537841797, -173.1499786376953, -165.76170349121094, -158.37344360351562, -150.98516845703125, -143.59689331054688, -136.20863342285156, -128.8203582763672, -121.43209075927734, -114.0438232421875, -106.65555572509766, -99.26728820800781, -91.87901306152344, -84.4907455444336, -77.10247039794922, -69.71420288085938, -62.325931549072266, -54.937660217285156, -47.54939270019531, -40.1611213684082, -32.772850036621094, -25.38458251953125, -17.99631118774414, -10.608041763305664, -3.219771385192871, 4.168498992919922, 11.556768417358398, 18.945037841796875, 26.333309173583984, 33.72157669067383, 41.10984802246094, 48.49811935424805, 55.88638687133789, 63.274658203125, 70.66292572021484, 78.05119323730469, 85.43946838378906, 92.8277359008789, 100.21600341796875, 107.6042709350586, 114.99254608154297, 122.38081359863281, 129.7690887451172, 137.1573486328125, 144.54562377929688, 151.93389892578125, 159.32217407226562, 166.71044921875, 174.0987091064453, 181.4869842529297, 188.87525939941406, 196.26351928710938, 203.65179443359375, 211.04006958007812, 218.42832946777344, 225.8166046142578, 233.20486450195312, 240.5931396484375, 247.98141479492188, 255.3696746826172, 262.7579345703125, 270.1462097167969, 277.53448486328125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 5.0, 8.0, 10.0, 17.0, 19.0, 7.0, 14.0, 21.0, 31.0, 26.0, 35.0, 31.0, 28.0, 46.0, 38.0, 37.0, 39.0, 44.0, 45.0, 40.0, 52.0, 50.0, 30.0, 26.0, 42.0, 30.0, 31.0, 23.0, 28.0, 26.0, 14.0, 18.0, 18.0, 14.0, 12.0, 15.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.4449462890625, -58.251590728759766, -56.05823516845703, -53.8648796081543, -51.67152404785156, -49.478172302246094, -47.28481674194336, -45.091461181640625, -42.89810562133789, -40.704750061035156, -38.51139450073242, -36.31803894042969, -34.12468719482422, -31.93132972717285, -29.73797607421875, -27.544620513916016, -25.35126495361328, -23.157909393310547, -20.964553833007812, -18.77120018005371, -16.577844619750977, -14.384489059448242, -12.191134452819824, -9.997779846191406, -7.804424285888672, -5.611069202423096, -3.4177141189575195, -1.2243590354919434, 0.9689960479736328, 3.162351608276367, 5.355706214904785, 7.549060821533203, 9.742416381835938, 11.935771942138672, 14.12912654876709, 16.322481155395508, 18.515836715698242, 20.709192276000977, 22.902545928955078, 25.095901489257812, 27.289257049560547, 29.48261260986328, 31.675968170166016, 33.86932373046875, 36.06267547607422, 38.25603485107422, 40.44938659667969, 42.64274215698242, 44.836097717285156, 47.02945327758789, 49.222808837890625, 51.41616439819336, 53.609519958496094, 55.80287170410156, 57.9962272644043, 60.18958282470703, 62.382938385009766, 64.5762939453125, 66.76964569091797, 68.96300506591797, 71.15635681152344, 73.34971618652344, 75.5430679321289, 77.73641967773438, 79.92977905273438]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 6.0, 5.0, 4.0, 9.0, 11.0, 11.0, 7.0, 14.0, 15.0, 25.0, 23.0, 20.0, 22.0, 30.0, 31.0, 30.0, 42.0, 41.0, 36.0, 35.0, 37.0, 43.0, 40.0, 42.0, 50.0, 29.0, 40.0, 33.0, 36.0, 21.0, 19.0, 22.0, 16.0, 24.0, 19.0, 18.0, 20.0, 20.0, 11.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-11.7421875, -11.4044189453125, -11.066650390625, -10.7288818359375, -10.39111328125, -10.0533447265625, -9.715576171875, -9.3778076171875, -9.0400390625, -8.7022705078125, -8.364501953125, -8.0267333984375, -7.68896484375, -7.3511962890625, -7.013427734375, -6.6756591796875, -6.337890625, -6.0001220703125, -5.662353515625, -5.3245849609375, -4.98681640625, -4.6490478515625, -4.311279296875, -3.9735107421875, -3.6357421875, -3.2979736328125, -2.960205078125, -2.6224365234375, -2.28466796875, -1.9468994140625, -1.609130859375, -1.2713623046875, -0.93359375, -0.5958251953125, -0.258056640625, 0.0797119140625, 0.41748046875, 0.7552490234375, 1.093017578125, 1.4307861328125, 1.7685546875, 2.1063232421875, 2.444091796875, 2.7818603515625, 3.11962890625, 3.4573974609375, 3.795166015625, 4.1329345703125, 4.470703125, 4.8084716796875, 5.146240234375, 5.4840087890625, 5.82177734375, 6.1595458984375, 6.497314453125, 6.8350830078125, 7.1728515625, 7.5106201171875, 7.848388671875, 8.1861572265625, 8.52392578125, 8.8616943359375, 9.199462890625, 9.5372314453125, 9.875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 5.0, 5.0, 7.0, 21.0, 15.0, 20.0, 37.0, 48.0, 73.0, 127.0, 152.0, 223.0, 332.0, 524.0, 744.0, 1120.0, 1583.0, 2354.0, 3309.0, 4829.0, 7164.0, 10470.0, 15703.0, 23708.0, 35778.0, 55189.0, 83800.0, 120954.0, 155934.0, 155330.0, 121076.0, 84124.0, 54938.0, 35896.0, 23955.0, 15697.0, 10547.0, 7028.0, 4962.0, 3288.0, 2351.0, 1652.0, 1107.0, 735.0, 494.0, 374.0, 260.0, 147.0, 137.0, 72.0, 55.0, 37.0, 27.0, 21.0, 14.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.72900390625, -0.7054901123046875, -0.681976318359375, -0.6584625244140625, -0.63494873046875, -0.6114349365234375, -0.587921142578125, -0.5644073486328125, -0.5408935546875, -0.5173797607421875, -0.493865966796875, -0.4703521728515625, -0.44683837890625, -0.4233245849609375, -0.399810791015625, -0.3762969970703125, -0.352783203125, -0.3292694091796875, -0.305755615234375, -0.2822418212890625, -0.25872802734375, -0.2352142333984375, -0.211700439453125, -0.1881866455078125, -0.1646728515625, -0.1411590576171875, -0.117645263671875, -0.0941314697265625, -0.07061767578125, -0.0471038818359375, -0.023590087890625, -7.62939453125e-05, 0.0234375, 0.0469512939453125, 0.070465087890625, 0.0939788818359375, 0.11749267578125, 0.1410064697265625, 0.164520263671875, 0.1880340576171875, 0.2115478515625, 0.2350616455078125, 0.258575439453125, 0.2820892333984375, 0.30560302734375, 0.3291168212890625, 0.352630615234375, 0.3761444091796875, 0.399658203125, 0.4231719970703125, 0.446685791015625, 0.4701995849609375, 0.49371337890625, 0.5172271728515625, 0.540740966796875, 0.5642547607421875, 0.5877685546875, 0.6112823486328125, 0.634796142578125, 0.6583099365234375, 0.68182373046875, 0.7053375244140625, 0.728851318359375, 0.7523651123046875, 0.77587890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 9.0, 10.0, 15.0, 8.0, 20.0, 19.0, 29.0, 27.0, 26.0, 34.0, 36.0, 19.0, 41.0, 55.0, 45.0, 28.0, 56.0, 1070.0, 40.0, 54.0, 44.0, 44.0, 37.0, 38.0, 32.0, 20.0, 18.0, 32.0, 13.0, 17.0, 23.0, 10.0, 9.0, 7.0, 13.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0, -6.74560546875, -6.4912109375, -6.23681640625, -5.982421875, -5.72802734375, -5.4736328125, -5.21923828125, -4.96484375, -4.71044921875, -4.4560546875, -4.20166015625, -3.947265625, -3.69287109375, -3.4384765625, -3.18408203125, -2.9296875, -2.67529296875, -2.4208984375, -2.16650390625, -1.912109375, -1.65771484375, -1.4033203125, -1.14892578125, -0.89453125, -0.64013671875, -0.3857421875, -0.13134765625, 0.123046875, 0.37744140625, 0.6318359375, 0.88623046875, 1.140625, 1.39501953125, 1.6494140625, 1.90380859375, 2.158203125, 2.41259765625, 2.6669921875, 2.92138671875, 3.17578125, 3.43017578125, 3.6845703125, 3.93896484375, 4.193359375, 4.44775390625, 4.7021484375, 4.95654296875, 5.2109375, 5.46533203125, 5.7197265625, 5.97412109375, 6.228515625, 6.48291015625, 6.7373046875, 6.99169921875, 7.24609375, 7.50048828125, 7.7548828125, 8.00927734375, 8.263671875, 8.51806640625, 8.7724609375, 9.02685546875, 9.28125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 7.0, 20.0, 22.0, 37.0, 55.0, 60.0, 108.0, 174.0, 270.0, 415.0, 589.0, 920.0, 1438.0, 2286.0, 3963.0, 6298.0, 10375.0, 17441.0, 28710.0, 46950.0, 74715.0, 111638.0, 170529.0, 1186586.0, 150491.0, 104453.0, 68432.0, 43180.0, 26064.0, 15918.0, 9740.0, 5863.0, 3580.0, 2132.0, 1311.0, 854.0, 496.0, 332.0, 251.0, 125.0, 80.0, 74.0, 47.0, 23.0, 30.0, 16.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.650390625, -0.63092041015625, -0.6114501953125, -0.59197998046875, -0.572509765625, -0.55303955078125, -0.5335693359375, -0.51409912109375, -0.49462890625, -0.47515869140625, -0.4556884765625, -0.43621826171875, -0.416748046875, -0.39727783203125, -0.3778076171875, -0.35833740234375, -0.3388671875, -0.31939697265625, -0.2999267578125, -0.28045654296875, -0.260986328125, -0.24151611328125, -0.2220458984375, -0.20257568359375, -0.18310546875, -0.16363525390625, -0.1441650390625, -0.12469482421875, -0.105224609375, -0.08575439453125, -0.0662841796875, -0.04681396484375, -0.02734375, -0.00787353515625, 0.0115966796875, 0.03106689453125, 0.050537109375, 0.07000732421875, 0.0894775390625, 0.10894775390625, 0.12841796875, 0.14788818359375, 0.1673583984375, 0.18682861328125, 0.206298828125, 0.22576904296875, 0.2452392578125, 0.26470947265625, 0.2841796875, 0.30364990234375, 0.3231201171875, 0.34259033203125, 0.362060546875, 0.38153076171875, 0.4010009765625, 0.42047119140625, 0.43994140625, 0.45941162109375, 0.4788818359375, 0.49835205078125, 0.517822265625, 0.53729248046875, 0.5567626953125, 0.57623291015625, 0.595703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 0.0, 4.0, 6.0, 5.0, 10.0, 9.0, 11.0, 3.0, 15.0, 18.0, 17.0, 21.0, 25.0, 42.0, 62.0, 76.0, 75.0, 105.0, 107.0, 98.0, 72.0, 42.0, 40.0, 21.0, 25.0, 22.0, 14.0, 12.0, 7.0, 10.0, 4.0, 9.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0293731689453125, -0.028477907180786133, -0.027582645416259766, -0.0266873836517334, -0.02579212188720703, -0.024896860122680664, -0.024001598358154297, -0.02310633659362793, -0.022211074829101562, -0.021315813064575195, -0.020420551300048828, -0.01952528953552246, -0.018630027770996094, -0.017734766006469727, -0.01683950424194336, -0.015944242477416992, -0.015048980712890625, -0.014153718948364258, -0.01325845718383789, -0.012363195419311523, -0.011467933654785156, -0.010572671890258789, -0.009677410125732422, -0.008782148361206055, -0.007886886596679688, -0.00699162483215332, -0.006096363067626953, -0.005201101303100586, -0.004305839538574219, -0.0034105777740478516, -0.0025153160095214844, -0.0016200542449951172, -0.00072479248046875, 0.0001704692840576172, 0.0010657310485839844, 0.0019609928131103516, 0.0028562545776367188, 0.003751516342163086, 0.004646778106689453, 0.00554203987121582, 0.0064373016357421875, 0.007332563400268555, 0.008227825164794922, 0.009123086929321289, 0.010018348693847656, 0.010913610458374023, 0.01180887222290039, 0.012704133987426758, 0.013599395751953125, 0.014494657516479492, 0.01538991928100586, 0.016285181045532227, 0.017180442810058594, 0.01807570457458496, 0.018970966339111328, 0.019866228103637695, 0.020761489868164062, 0.02165675163269043, 0.022552013397216797, 0.023447275161743164, 0.02434253692626953, 0.0252377986907959, 0.026133060455322266, 0.027028322219848633, 0.027923583984375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 3.0, 6.0, 13.0, 10.0, 15.0, 12.0, 25.0, 34.0, 42.0, 43.0, 79.0, 119.0, 224.0, 574.0, 18072.0, 1023958.0, 4301.0, 389.0, 219.0, 125.0, 76.0, 39.0, 23.0, 40.0, 19.0, 13.0, 13.0, 11.0, 15.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5732421875, -0.5543746948242188, -0.5355072021484375, -0.5166397094726562, -0.497772216796875, -0.47890472412109375, -0.4600372314453125, -0.44116973876953125, -0.42230224609375, -0.40343475341796875, -0.3845672607421875, -0.36569976806640625, -0.346832275390625, -0.32796478271484375, -0.3090972900390625, -0.29022979736328125, -0.2713623046875, -0.25249481201171875, -0.2336273193359375, -0.21475982666015625, -0.195892333984375, -0.17702484130859375, -0.1581573486328125, -0.13928985595703125, -0.12042236328125, -0.10155487060546875, -0.0826873779296875, -0.06381988525390625, -0.044952392578125, -0.02608489990234375, -0.0072174072265625, 0.01165008544921875, 0.030517578125, 0.04938507080078125, 0.0682525634765625, 0.08712005615234375, 0.105987548828125, 0.12485504150390625, 0.1437225341796875, 0.16259002685546875, 0.18145751953125, 0.20032501220703125, 0.2191925048828125, 0.23805999755859375, 0.256927490234375, 0.27579498291015625, 0.2946624755859375, 0.31352996826171875, 0.3323974609375, 0.35126495361328125, 0.3701324462890625, 0.38899993896484375, 0.407867431640625, 0.42673492431640625, 0.4456024169921875, 0.46446990966796875, 0.48333740234375, 0.5022048950195312, 0.5210723876953125, 0.5399398803710938, 0.558807373046875, 0.5776748657226562, 0.5965423583984375, 0.6154098510742188, 0.63427734375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 218.0, 775.0, 20.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041298989206552505, -0.03557164967060089, -0.02984430640935898, -0.024116966873407364, -0.0183896254748106, -0.012662284076213837, -0.006934944540262222, -0.0012076012790203094, 0.004519738256931305, 0.010247079655528069, 0.015974421054124832, 0.021701760590076447, 0.02742910198867321, 0.033156443387269974, 0.03888378292322159, 0.0446111261844635, 0.050338465720415115, 0.05606580525636673, 0.06179314851760864, 0.06752048432826996, 0.07324782758951187, 0.07897517085075378, 0.0847025066614151, 0.09042985737323761, 0.09615719318389893, 0.10188453644514084, 0.10761187225580215, 0.11333921551704407, 0.11906655877828598, 0.1247939020395279, 0.1305212378501892, 0.13624858856201172, 0.14197592437267303, 0.14770326018333435, 0.15343061089515686, 0.15915794670581818, 0.1648852825164795, 0.170612633228302, 0.17633996903896332, 0.18206730484962463, 0.18779465556144714, 0.19352199137210846, 0.19924934208393097, 0.20497667789459229, 0.2107040137052536, 0.2164313644170761, 0.22215870022773743, 0.22788605093955994, 0.23361337184906006, 0.23934070765972137, 0.24506805837154388, 0.2507953941822052, 0.2565227448940277, 0.26225006580352783, 0.26797741651535034, 0.27370476722717285, 0.27943211793899536, 0.28515946865081787, 0.290886789560318, 0.2966141402721405, 0.302341490983963, 0.30806881189346313, 0.31379616260528564, 0.31952351331710815, 0.3252508342266083]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 8.0, 12.0, 13.0, 17.0, 19.0, 33.0, 28.0, 34.0, 51.0, 46.0, 53.0, 56.0, 57.0, 60.0, 53.0, 66.0, 51.0, 55.0, 54.0, 53.0, 34.0, 37.0, 25.0, 23.0, 13.0, 14.0, 9.0, 9.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02470952272415161, -0.02404044382274151, -0.023371364921331406, -0.022702286019921303, -0.0220332071185112, -0.021364128217101097, -0.020695049315690994, -0.02002597041428089, -0.01935689151287079, -0.018687812611460686, -0.018018733710050583, -0.01734965480864048, -0.016680575907230377, -0.016011497005820274, -0.015342418104410172, -0.014673339203000069, -0.014004260301589966, -0.013335181400179863, -0.01266610249876976, -0.011997023597359657, -0.011327944695949554, -0.010658865794539452, -0.009989786893129349, -0.009320707991719246, -0.008651629090309143, -0.00798255018889904, -0.007313471287488937, -0.0066443923860788345, -0.005975313484668732, -0.005306234583258629, -0.004637155681848526, -0.003968076780438423, -0.0032989978790283203, -0.0026299189776182175, -0.0019608400762081146, -0.0012917611747980118, -0.0006226822733879089, 4.639662802219391e-05, 0.0007154755294322968, 0.0013845544308423996, 0.0020536333322525024, 0.0027227122336626053, 0.003391791135072708, 0.004060870036482811, 0.004729948937892914, 0.005399027839303017, 0.0060681067407131195, 0.006737185642123222, 0.007406264543533325, 0.008075343444943428, 0.008744422346353531, 0.009413501247763634, 0.010082580149173737, 0.01075165905058384, 0.011420737951993942, 0.012089816853404045, 0.012758895754814148, 0.01342797465622425, 0.014097053557634354, 0.014766132459044456, 0.01543521136045456, 0.016104290261864662, 0.016773369163274765, 0.017442448064684868, 0.01811152696609497]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 1.0, 6.0, 5.0, 4.0, 9.0, 11.0, 11.0, 7.0, 14.0, 15.0, 25.0, 23.0, 20.0, 22.0, 30.0, 31.0, 30.0, 42.0, 41.0, 36.0, 35.0, 37.0, 43.0, 40.0, 42.0, 50.0, 29.0, 40.0, 33.0, 36.0, 19.0, 20.0, 22.0, 17.0, 24.0, 18.0, 19.0, 20.0, 20.0, 11.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-11.7421875, -11.4044189453125, -11.066650390625, -10.7288818359375, -10.39111328125, -10.0533447265625, -9.715576171875, -9.3778076171875, -9.0400390625, -8.7022705078125, -8.364501953125, -8.0267333984375, -7.68896484375, -7.3511962890625, -7.013427734375, -6.6756591796875, -6.337890625, -6.0001220703125, -5.662353515625, -5.3245849609375, -4.98681640625, -4.6490478515625, -4.311279296875, -3.9735107421875, -3.6357421875, -3.2979736328125, -2.960205078125, -2.6224365234375, -2.28466796875, -1.9468994140625, -1.609130859375, -1.2713623046875, -0.93359375, -0.5958251953125, -0.258056640625, 0.0797119140625, 0.41748046875, 0.7552490234375, 1.093017578125, 1.4307861328125, 1.7685546875, 2.1063232421875, 2.444091796875, 2.7818603515625, 3.11962890625, 3.4573974609375, 3.795166015625, 4.1329345703125, 4.470703125, 4.8084716796875, 5.146240234375, 5.4840087890625, 5.82177734375, 6.1595458984375, 6.497314453125, 6.8350830078125, 7.1728515625, 7.5106201171875, 7.848388671875, 8.1861572265625, 8.52392578125, 8.8616943359375, 9.199462890625, 9.5372314453125, 9.875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 5.0, 8.0, 9.0, 9.0, 14.0, 27.0, 19.0, 51.0, 66.0, 116.0, 189.0, 267.0, 438.0, 786.0, 1343.0, 2528.0, 4683.0, 8834.0, 17090.0, 35437.0, 81461.0, 218451.0, 375839.0, 172606.0, 66879.0, 30055.0, 14734.0, 7369.0, 3939.0, 2171.0, 1204.0, 736.0, 416.0, 258.0, 177.0, 106.0, 71.0, 49.0, 35.0, 12.0, 16.0, 12.0, 10.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.8828125, -9.5867919921875, -9.290771484375, -8.9947509765625, -8.69873046875, -8.4027099609375, -8.106689453125, -7.8106689453125, -7.5146484375, -7.2186279296875, -6.922607421875, -6.6265869140625, -6.33056640625, -6.0345458984375, -5.738525390625, -5.4425048828125, -5.146484375, -4.8504638671875, -4.554443359375, -4.2584228515625, -3.96240234375, -3.6663818359375, -3.370361328125, -3.0743408203125, -2.7783203125, -2.4822998046875, -2.186279296875, -1.8902587890625, -1.59423828125, -1.2982177734375, -1.002197265625, -0.7061767578125, -0.41015625, -0.1141357421875, 0.181884765625, 0.4779052734375, 0.77392578125, 1.0699462890625, 1.365966796875, 1.6619873046875, 1.9580078125, 2.2540283203125, 2.550048828125, 2.8460693359375, 3.14208984375, 3.4381103515625, 3.734130859375, 4.0301513671875, 4.326171875, 4.6221923828125, 4.918212890625, 5.2142333984375, 5.51025390625, 5.8062744140625, 6.102294921875, 6.3983154296875, 6.6943359375, 6.9903564453125, 7.286376953125, 7.5823974609375, 7.87841796875, 8.1744384765625, 8.470458984375, 8.7664794921875, 9.0625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 11.0, 12.0, 14.0, 10.0, 9.0, 15.0, 21.0, 36.0, 25.0, 32.0, 28.0, 35.0, 41.0, 44.0, 60.0, 74.0, 154.0, 1547.0, 341.0, 117.0, 57.0, 38.0, 34.0, 36.0, 34.0, 47.0, 20.0, 20.0, 27.0, 9.0, 20.0, 15.0, 10.0, 11.0, 10.0, 5.0, 3.0, 8.0, 6.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.4375, -34.28857421875, -33.1396484375, -31.99072265625, -30.841796875, -29.69287109375, -28.5439453125, -27.39501953125, -26.24609375, -25.09716796875, -23.9482421875, -22.79931640625, -21.650390625, -20.50146484375, -19.3525390625, -18.20361328125, -17.0546875, -15.90576171875, -14.7568359375, -13.60791015625, -12.458984375, -11.31005859375, -10.1611328125, -9.01220703125, -7.86328125, -6.71435546875, -5.5654296875, -4.41650390625, -3.267578125, -2.11865234375, -0.9697265625, 0.17919921875, 1.328125, 2.47705078125, 3.6259765625, 4.77490234375, 5.923828125, 7.07275390625, 8.2216796875, 9.37060546875, 10.51953125, 11.66845703125, 12.8173828125, 13.96630859375, 15.115234375, 16.26416015625, 17.4130859375, 18.56201171875, 19.7109375, 20.85986328125, 22.0087890625, 23.15771484375, 24.306640625, 25.45556640625, 26.6044921875, 27.75341796875, 28.90234375, 30.05126953125, 31.2001953125, 32.34912109375, 33.498046875, 34.64697265625, 35.7958984375, 36.94482421875, 38.09375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 8.0, 19.0, 23.0, 13.0, 20.0, 34.0, 29.0, 32.0, 71.0, 82.0, 115.0, 123.0, 191.0, 285.0, 524.0, 1928.0, 37743.0, 2987917.0, 110950.0, 3619.0, 696.0, 381.0, 229.0, 146.0, 121.0, 83.0, 72.0, 56.0, 35.0, 32.0, 17.0, 19.0, 17.0, 13.0, 15.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.78125, -59.8876953125, -57.994140625, -56.1005859375, -54.20703125, -52.3134765625, -50.419921875, -48.5263671875, -46.6328125, -44.7392578125, -42.845703125, -40.9521484375, -39.05859375, -37.1650390625, -35.271484375, -33.3779296875, -31.484375, -29.5908203125, -27.697265625, -25.8037109375, -23.91015625, -22.0166015625, -20.123046875, -18.2294921875, -16.3359375, -14.4423828125, -12.548828125, -10.6552734375, -8.76171875, -6.8681640625, -4.974609375, -3.0810546875, -1.1875, 0.7060546875, 2.599609375, 4.4931640625, 6.38671875, 8.2802734375, 10.173828125, 12.0673828125, 13.9609375, 15.8544921875, 17.748046875, 19.6416015625, 21.53515625, 23.4287109375, 25.322265625, 27.2158203125, 29.109375, 31.0029296875, 32.896484375, 34.7900390625, 36.68359375, 38.5771484375, 40.470703125, 42.3642578125, 44.2578125, 46.1513671875, 48.044921875, 49.9384765625, 51.83203125, 53.7255859375, 55.619140625, 57.5126953125, 59.40625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 34.0, 516.0, 441.0, 26.0, 1.0, 0.0, 1.0], "bins": [-482.9097595214844, -474.7137756347656, -466.5177917480469, -458.3218078613281, -450.1258239746094, -441.9298400878906, -433.7338562011719, -425.537841796875, -417.34185791015625, -409.1458740234375, -400.94989013671875, -392.75390625, -384.55792236328125, -376.3619384765625, -368.16595458984375, -359.969970703125, -351.77398681640625, -343.5780029296875, -335.38201904296875, -327.18603515625, -318.99005126953125, -310.7940673828125, -302.59808349609375, -294.402099609375, -286.20611572265625, -278.0101318359375, -269.81414794921875, -261.6181640625, -253.42218017578125, -245.2261962890625, -237.0301971435547, -228.83421325683594, -220.63818359375, -212.44219970703125, -204.2462158203125, -196.05023193359375, -187.854248046875, -179.65826416015625, -171.46226501464844, -163.2662811279297, -155.07029724121094, -146.8743133544922, -138.67832946777344, -130.4823455810547, -122.2863540649414, -114.09037017822266, -105.89437866210938, -97.69839477539062, -89.50241088867188, -81.30642700195312, -73.11044311523438, -64.9144515991211, -56.718467712402344, -48.522483825683594, -40.32649612426758, -32.13050842285156, -23.934524536132812, -15.73853874206543, -7.542552947998047, 0.6534328460693359, 8.849418640136719, 17.04540252685547, 25.241390228271484, 33.4373779296875, 41.63336181640625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 13.0, 17.0, 16.0, 17.0, 18.0, 28.0, 32.0, 20.0, 39.0, 34.0, 38.0, 42.0, 36.0, 51.0, 41.0, 41.0, 35.0, 44.0, 42.0, 41.0, 41.0, 45.0, 39.0, 24.0, 24.0, 25.0, 22.0, 24.0, 17.0, 11.0, 12.0, 11.0, 8.0, 6.0, 3.0, 4.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.49349975585938, -81.39781188964844, -78.30211639404297, -75.20642852783203, -72.1107406616211, -69.01504516601562, -65.91935729980469, -62.82366943359375, -59.72797775268555, -56.632286071777344, -53.536598205566406, -50.4409065246582, -47.34521484375, -44.24952697753906, -41.15383529663086, -38.058143615722656, -34.96245574951172, -31.86676597595215, -28.771076202392578, -25.675384521484375, -22.579694747924805, -19.484004974365234, -16.38831329345703, -13.292623519897461, -10.19693374633789, -7.101243495941162, -4.005553245544434, -0.9098625183105469, 2.1858272552490234, 5.281517028808594, 8.377208709716797, 11.472898483276367, 14.568588256835938, 17.664278030395508, 20.759967803955078, 23.85565948486328, 26.95134925842285, 30.047039031982422, 33.142730712890625, 36.23841857910156, 39.334110260009766, 42.42980194091797, 45.525489807128906, 48.62118148803711, 51.71687316894531, 54.81256103515625, 57.90825271606445, 61.003944396972656, 64.0996322631836, 67.19532012939453, 70.291015625, 73.38670349121094, 76.48239135742188, 79.57807922363281, 82.67377471923828, 85.76946258544922, 88.86515808105469, 91.96084594726562, 95.0565414428711, 98.15222930908203, 101.24791717529297, 104.34361267089844, 107.43930053710938, 110.53498840332031, 113.63067626953125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 1.0, 5.0, 5.0, 14.0, 13.0, 18.0, 19.0, 25.0, 13.0, 18.0, 23.0, 23.0, 26.0, 42.0, 32.0, 37.0, 48.0, 37.0, 37.0, 44.0, 42.0, 50.0, 43.0, 39.0, 37.0, 36.0, 29.0, 31.0, 20.0, 24.0, 18.0, 22.0, 23.0, 13.0, 22.0, 10.0, 12.0, 7.0, 7.0, 4.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.2734375, -11.921142578125, -11.56884765625, -11.216552734375, -10.8642578125, -10.511962890625, -10.15966796875, -9.807373046875, -9.455078125, -9.102783203125, -8.75048828125, -8.398193359375, -8.0458984375, -7.693603515625, -7.34130859375, -6.989013671875, -6.63671875, -6.284423828125, -5.93212890625, -5.579833984375, -5.2275390625, -4.875244140625, -4.52294921875, -4.170654296875, -3.818359375, -3.466064453125, -3.11376953125, -2.761474609375, -2.4091796875, -2.056884765625, -1.70458984375, -1.352294921875, -1.0, -0.647705078125, -0.29541015625, 0.056884765625, 0.4091796875, 0.761474609375, 1.11376953125, 1.466064453125, 1.818359375, 2.170654296875, 2.52294921875, 2.875244140625, 3.2275390625, 3.579833984375, 3.93212890625, 4.284423828125, 4.63671875, 4.989013671875, 5.34130859375, 5.693603515625, 6.0458984375, 6.398193359375, 6.75048828125, 7.102783203125, 7.455078125, 7.807373046875, 8.15966796875, 8.511962890625, 8.8642578125, 9.216552734375, 9.56884765625, 9.921142578125, 10.2734375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 13.0, 5.0, 12.0, 9.0, 21.0, 26.0, 25.0, 29.0, 45.0, 49.0, 54.0, 112.0, 174.0, 383.0, 887.0, 2540.0, 9826.0, 55300.0, 546595.0, 2784951.0, 708648.0, 68423.0, 11345.0, 2812.0, 959.0, 410.0, 195.0, 105.0, 70.0, 56.0, 46.0, 30.0, 28.0, 16.0, 15.0, 6.0, 6.0, 9.0, 11.0, 11.0, 9.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-28.5625, -27.73583984375, -26.9091796875, -26.08251953125, -25.255859375, -24.42919921875, -23.6025390625, -22.77587890625, -21.94921875, -21.12255859375, -20.2958984375, -19.46923828125, -18.642578125, -17.81591796875, -16.9892578125, -16.16259765625, -15.3359375, -14.50927734375, -13.6826171875, -12.85595703125, -12.029296875, -11.20263671875, -10.3759765625, -9.54931640625, -8.72265625, -7.89599609375, -7.0693359375, -6.24267578125, -5.416015625, -4.58935546875, -3.7626953125, -2.93603515625, -2.109375, -1.28271484375, -0.4560546875, 0.37060546875, 1.197265625, 2.02392578125, 2.8505859375, 3.67724609375, 4.50390625, 5.33056640625, 6.1572265625, 6.98388671875, 7.810546875, 8.63720703125, 9.4638671875, 10.29052734375, 11.1171875, 11.94384765625, 12.7705078125, 13.59716796875, 14.423828125, 15.25048828125, 16.0771484375, 16.90380859375, 17.73046875, 18.55712890625, 19.3837890625, 20.21044921875, 21.037109375, 21.86376953125, 22.6904296875, 23.51708984375, 24.34375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 8.0, 15.0, 20.0, 29.0, 31.0, 54.0, 83.0, 124.0, 181.0, 277.0, 396.0, 549.0, 656.0, 534.0, 382.0, 237.0, 157.0, 120.0, 74.0, 40.0, 38.0, 26.0, 10.0, 10.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.890625, -27.080322265625, -26.27001953125, -25.459716796875, -24.6494140625, -23.839111328125, -23.02880859375, -22.218505859375, -21.408203125, -20.597900390625, -19.78759765625, -18.977294921875, -18.1669921875, -17.356689453125, -16.54638671875, -15.736083984375, -14.92578125, -14.115478515625, -13.30517578125, -12.494873046875, -11.6845703125, -10.874267578125, -10.06396484375, -9.253662109375, -8.443359375, -7.633056640625, -6.82275390625, -6.012451171875, -5.2021484375, -4.391845703125, -3.58154296875, -2.771240234375, -1.9609375, -1.150634765625, -0.34033203125, 0.469970703125, 1.2802734375, 2.090576171875, 2.90087890625, 3.711181640625, 4.521484375, 5.331787109375, 6.14208984375, 6.952392578125, 7.7626953125, 8.572998046875, 9.38330078125, 10.193603515625, 11.00390625, 11.814208984375, 12.62451171875, 13.434814453125, 14.2451171875, 15.055419921875, 15.86572265625, 16.676025390625, 17.486328125, 18.296630859375, 19.10693359375, 19.917236328125, 20.7275390625, 21.537841796875, 22.34814453125, 23.158447265625, 23.96875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 10.0, 4.0, 14.0, 13.0, 28.0, 38.0, 49.0, 64.0, 88.0, 140.0, 204.0, 280.0, 572.0, 1797.0, 17385.0, 1160744.0, 2975044.0, 33580.0, 2475.0, 716.0, 305.0, 222.0, 139.0, 86.0, 61.0, 71.0, 50.0, 40.0, 22.0, 19.0, 10.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.875, -62.3896484375, -59.904296875, -57.4189453125, -54.93359375, -52.4482421875, -49.962890625, -47.4775390625, -44.9921875, -42.5068359375, -40.021484375, -37.5361328125, -35.05078125, -32.5654296875, -30.080078125, -27.5947265625, -25.109375, -22.6240234375, -20.138671875, -17.6533203125, -15.16796875, -12.6826171875, -10.197265625, -7.7119140625, -5.2265625, -2.7412109375, -0.255859375, 2.2294921875, 4.71484375, 7.2001953125, 9.685546875, 12.1708984375, 14.65625, 17.1416015625, 19.626953125, 22.1123046875, 24.59765625, 27.0830078125, 29.568359375, 32.0537109375, 34.5390625, 37.0244140625, 39.509765625, 41.9951171875, 44.48046875, 46.9658203125, 49.451171875, 51.9365234375, 54.421875, 56.9072265625, 59.392578125, 61.8779296875, 64.36328125, 66.8486328125, 69.333984375, 71.8193359375, 74.3046875, 76.7900390625, 79.275390625, 81.7607421875, 84.24609375, 86.7314453125, 89.216796875, 91.7021484375, 94.1875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 20.0, 286.0, 593.0, 111.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-218.1983184814453, -201.80213928222656, -185.40594482421875, -169.009765625, -152.61358642578125, -136.21739196777344, -119.82121276855469, -103.4250259399414, -87.02883911132812, -70.63265228271484, -54.23646926879883, -37.84028625488281, -21.44409942626953, -5.04791259765625, 11.3482666015625, 27.74445343017578, 44.14064025878906, 60.536827087402344, 76.93301391601562, 93.32919311523438, 109.72537994384766, 126.12156677246094, 142.5177459716797, 158.9139404296875, 175.31011962890625, 191.706298828125, 208.1024932861328, 224.49867248535156, 240.89486694335938, 257.2910461425781, 273.6872253417969, 290.0834045410156, 306.4796142578125, 322.87579345703125, 339.27197265625, 355.66815185546875, 372.0643615722656, 388.4605407714844, 404.8567199707031, 421.2528991699219, 437.64910888671875, 454.0452880859375, 470.44146728515625, 486.837646484375, 503.2338562011719, 519.6300048828125, 536.0262451171875, 552.4224243164062, 568.818603515625, 585.2147827148438, 601.6109619140625, 618.0071411132812, 634.4033203125, 650.799560546875, 667.1956787109375, 683.5919189453125, 699.988037109375, 716.3842163085938, 732.7803955078125, 749.1765747070312, 765.57275390625, 781.968994140625, 798.3651123046875, 814.7613525390625, 831.1575317382812]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 4.0, 11.0, 10.0, 15.0, 12.0, 12.0, 22.0, 28.0, 31.0, 30.0, 26.0, 30.0, 35.0, 31.0, 39.0, 44.0, 39.0, 40.0, 55.0, 68.0, 46.0, 40.0, 41.0, 29.0, 39.0, 40.0, 25.0, 29.0, 23.0, 20.0, 21.0, 9.0, 12.0, 11.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.515350341796875, -59.27070999145508, -57.02606964111328, -54.78142547607422, -52.53678512573242, -50.292144775390625, -48.04750061035156, -45.802860260009766, -43.55821990966797, -41.31357955932617, -39.068939208984375, -36.82429504394531, -34.579654693603516, -32.33501434326172, -30.09037208557129, -27.84572982788086, -25.601089477539062, -23.356449127197266, -21.111806869506836, -18.867164611816406, -16.62252426147461, -14.377882957458496, -12.133241653442383, -9.88860034942627, -7.643959045410156, -5.399317741394043, -3.1546764373779297, -0.9100351333618164, 1.3346061706542969, 3.57924747467041, 5.823888778686523, 8.068530082702637, 10.31317138671875, 12.557812690734863, 14.802453994750977, 17.047096252441406, 19.291736602783203, 21.536376953125, 23.78101921081543, 26.02566146850586, 28.270301818847656, 30.514942169189453, 32.75958251953125, 35.00422668457031, 37.24886703491211, 39.493507385253906, 41.73815155029297, 43.982791900634766, 46.22743225097656, 48.47207260131836, 50.716712951660156, 52.96135711669922, 55.205997467041016, 57.45063781738281, 59.695281982421875, 61.93992233276367, 64.18456268310547, 66.42920684814453, 68.67384338378906, 70.91848754882812, 73.16313171386719, 75.40776824951172, 77.65241241455078, 79.89704895019531, 82.14169311523438]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 7.0, 10.0, 4.0, 6.0, 9.0, 14.0, 19.0, 22.0, 33.0, 26.0, 15.0, 23.0, 25.0, 36.0, 21.0, 28.0, 49.0, 37.0, 46.0, 33.0, 43.0, 29.0, 51.0, 32.0, 42.0, 34.0, 37.0, 29.0, 31.0, 31.0, 26.0, 25.0, 15.0, 22.0, 14.0, 6.0, 15.0, 9.0, 11.0, 9.0, 8.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.5458984375, -10.201171875, -9.8564453125, -9.51171875, -9.1669921875, -8.822265625, -8.4775390625, -8.1328125, -7.7880859375, -7.443359375, -7.0986328125, -6.75390625, -6.4091796875, -6.064453125, -5.7197265625, -5.375, -5.0302734375, -4.685546875, -4.3408203125, -3.99609375, -3.6513671875, -3.306640625, -2.9619140625, -2.6171875, -2.2724609375, -1.927734375, -1.5830078125, -1.23828125, -0.8935546875, -0.548828125, -0.2041015625, 0.140625, 0.4853515625, 0.830078125, 1.1748046875, 1.51953125, 1.8642578125, 2.208984375, 2.5537109375, 2.8984375, 3.2431640625, 3.587890625, 3.9326171875, 4.27734375, 4.6220703125, 4.966796875, 5.3115234375, 5.65625, 6.0009765625, 6.345703125, 6.6904296875, 7.03515625, 7.3798828125, 7.724609375, 8.0693359375, 8.4140625, 8.7587890625, 9.103515625, 9.4482421875, 9.79296875, 10.1376953125, 10.482421875, 10.8271484375, 11.171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 7.0, 5.0, 10.0, 12.0, 21.0, 31.0, 41.0, 61.0, 104.0, 142.0, 198.0, 290.0, 404.0, 642.0, 912.0, 1328.0, 1965.0, 2776.0, 4201.0, 6165.0, 8943.0, 13220.0, 19696.0, 28906.0, 43865.0, 64265.0, 91162.0, 122845.0, 147451.0, 138285.0, 107829.0, 77764.0, 53971.0, 36209.0, 24360.0, 16211.0, 10922.0, 7330.0, 5120.0, 3334.0, 2357.0, 1657.0, 1090.0, 733.0, 539.0, 383.0, 235.0, 193.0, 121.0, 79.0, 55.0, 49.0, 19.0, 22.0, 13.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0], "bins": [-0.7216796875, -0.6989593505859375, -0.676239013671875, -0.6535186767578125, -0.63079833984375, -0.6080780029296875, -0.585357666015625, -0.5626373291015625, -0.5399169921875, -0.5171966552734375, -0.494476318359375, -0.4717559814453125, -0.44903564453125, -0.4263153076171875, -0.403594970703125, -0.3808746337890625, -0.358154296875, -0.3354339599609375, -0.312713623046875, -0.2899932861328125, -0.26727294921875, -0.2445526123046875, -0.221832275390625, -0.1991119384765625, -0.1763916015625, -0.1536712646484375, -0.130950927734375, -0.1082305908203125, -0.08551025390625, -0.0627899169921875, -0.040069580078125, -0.0173492431640625, 0.00537109375, 0.0280914306640625, 0.050811767578125, 0.0735321044921875, 0.09625244140625, 0.1189727783203125, 0.141693115234375, 0.1644134521484375, 0.1871337890625, 0.2098541259765625, 0.232574462890625, 0.2552947998046875, 0.27801513671875, 0.3007354736328125, 0.323455810546875, 0.3461761474609375, 0.368896484375, 0.3916168212890625, 0.414337158203125, 0.4370574951171875, 0.45977783203125, 0.4824981689453125, 0.505218505859375, 0.5279388427734375, 0.5506591796875, 0.5733795166015625, 0.596099853515625, 0.6188201904296875, 0.64154052734375, 0.6642608642578125, 0.686981201171875, 0.7097015380859375, 0.732421875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 7.0, 9.0, 14.0, 8.0, 13.0, 12.0, 11.0, 19.0, 21.0, 23.0, 33.0, 31.0, 39.0, 37.0, 38.0, 28.0, 40.0, 39.0, 34.0, 1069.0, 49.0, 53.0, 47.0, 46.0, 41.0, 20.0, 32.0, 23.0, 28.0, 23.0, 18.0, 16.0, 17.0, 10.0, 15.0, 8.0, 11.0, 12.0, 10.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.562255859375, -7.31591796875, -7.069580078125, -6.8232421875, -6.576904296875, -6.33056640625, -6.084228515625, -5.837890625, -5.591552734375, -5.34521484375, -5.098876953125, -4.8525390625, -4.606201171875, -4.35986328125, -4.113525390625, -3.8671875, -3.620849609375, -3.37451171875, -3.128173828125, -2.8818359375, -2.635498046875, -2.38916015625, -2.142822265625, -1.896484375, -1.650146484375, -1.40380859375, -1.157470703125, -0.9111328125, -0.664794921875, -0.41845703125, -0.172119140625, 0.07421875, 0.320556640625, 0.56689453125, 0.813232421875, 1.0595703125, 1.305908203125, 1.55224609375, 1.798583984375, 2.044921875, 2.291259765625, 2.53759765625, 2.783935546875, 3.0302734375, 3.276611328125, 3.52294921875, 3.769287109375, 4.015625, 4.261962890625, 4.50830078125, 4.754638671875, 5.0009765625, 5.247314453125, 5.49365234375, 5.739990234375, 5.986328125, 6.232666015625, 6.47900390625, 6.725341796875, 6.9716796875, 7.218017578125, 7.46435546875, 7.710693359375, 7.95703125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 10.0, 6.0, 19.0, 33.0, 52.0, 77.0, 134.0, 179.0, 319.0, 487.0, 851.0, 1322.0, 2164.0, 3688.0, 5878.0, 9609.0, 15912.0, 25330.0, 40164.0, 62846.0, 94193.0, 135710.0, 1100143.0, 250979.0, 120120.0, 82976.0, 53899.0, 34163.0, 21436.0, 13424.0, 8133.0, 4889.0, 3148.0, 1902.0, 1141.0, 707.0, 399.0, 268.0, 134.0, 93.0, 66.0, 43.0, 32.0, 15.0, 20.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.65576171875, -0.6363754272460938, -0.6169891357421875, -0.5976028442382812, -0.578216552734375, -0.5588302612304688, -0.5394439697265625, -0.5200576782226562, -0.50067138671875, -0.48128509521484375, -0.4618988037109375, -0.44251251220703125, -0.423126220703125, -0.40373992919921875, -0.3843536376953125, -0.36496734619140625, -0.3455810546875, -0.32619476318359375, -0.3068084716796875, -0.28742218017578125, -0.268035888671875, -0.24864959716796875, -0.2292633056640625, -0.20987701416015625, -0.19049072265625, -0.17110443115234375, -0.1517181396484375, -0.13233184814453125, -0.112945556640625, -0.09355926513671875, -0.0741729736328125, -0.05478668212890625, -0.035400390625, -0.01601409912109375, 0.0033721923828125, 0.02275848388671875, 0.042144775390625, 0.06153106689453125, 0.0809173583984375, 0.10030364990234375, 0.11968994140625, 0.13907623291015625, 0.1584625244140625, 0.17784881591796875, 0.197235107421875, 0.21662139892578125, 0.2360076904296875, 0.25539398193359375, 0.2747802734375, 0.29416656494140625, 0.3135528564453125, 0.33293914794921875, 0.352325439453125, 0.37171173095703125, 0.3910980224609375, 0.41048431396484375, 0.42987060546875, 0.44925689697265625, 0.4686431884765625, 0.48802947998046875, 0.507415771484375, 0.5268020629882812, 0.5461883544921875, 0.5655746459960938, 0.5849609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 8.0, 11.0, 7.0, 13.0, 12.0, 14.0, 20.0, 23.0, 22.0, 29.0, 35.0, 46.0, 90.0, 93.0, 110.0, 82.0, 81.0, 50.0, 41.0, 34.0, 25.0, 21.0, 15.0, 19.0, 12.0, 13.0, 17.0, 7.0, 10.0, 6.0, 7.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032470703125, -0.03144121170043945, -0.030411720275878906, -0.02938222885131836, -0.028352737426757812, -0.027323246002197266, -0.02629375457763672, -0.025264263153076172, -0.024234771728515625, -0.023205280303955078, -0.02217578887939453, -0.021146297454833984, -0.020116806030273438, -0.01908731460571289, -0.018057823181152344, -0.017028331756591797, -0.01599884033203125, -0.014969348907470703, -0.013939857482910156, -0.01291036605834961, -0.011880874633789062, -0.010851383209228516, -0.009821891784667969, -0.008792400360107422, -0.007762908935546875, -0.006733417510986328, -0.005703926086425781, -0.004674434661865234, -0.0036449432373046875, -0.0026154518127441406, -0.0015859603881835938, -0.0005564689636230469, 0.0004730224609375, 0.0015025138854980469, 0.0025320053100585938, 0.0035614967346191406, 0.0045909881591796875, 0.005620479583740234, 0.006649971008300781, 0.007679462432861328, 0.008708953857421875, 0.009738445281982422, 0.010767936706542969, 0.011797428131103516, 0.012826919555664062, 0.01385641098022461, 0.014885902404785156, 0.015915393829345703, 0.01694488525390625, 0.017974376678466797, 0.019003868103027344, 0.02003335952758789, 0.021062850952148438, 0.022092342376708984, 0.02312183380126953, 0.024151325225830078, 0.025180816650390625, 0.026210308074951172, 0.02723979949951172, 0.028269290924072266, 0.029298782348632812, 0.03032827377319336, 0.031357765197753906, 0.03238725662231445, 0.033416748046875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 4.0, 12.0, 10.0, 9.0, 14.0, 20.0, 24.0, 18.0, 34.0, 44.0, 39.0, 65.0, 91.0, 163.0, 329.0, 687.0, 34641.0, 1009761.0, 1539.0, 400.0, 210.0, 122.0, 70.0, 51.0, 35.0, 37.0, 26.0, 22.0, 16.0, 7.0, 13.0, 9.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6498870849609375, -0.628387451171875, -0.6068878173828125, -0.58538818359375, -0.5638885498046875, -0.542388916015625, -0.5208892822265625, -0.4993896484375, -0.4778900146484375, -0.456390380859375, -0.4348907470703125, -0.41339111328125, -0.3918914794921875, -0.370391845703125, -0.3488922119140625, -0.327392578125, -0.3058929443359375, -0.284393310546875, -0.2628936767578125, -0.24139404296875, -0.2198944091796875, -0.198394775390625, -0.1768951416015625, -0.1553955078125, -0.1338958740234375, -0.112396240234375, -0.0908966064453125, -0.06939697265625, -0.0478973388671875, -0.026397705078125, -0.0048980712890625, 0.0166015625, 0.0381011962890625, 0.059600830078125, 0.0811004638671875, 0.10260009765625, 0.1240997314453125, 0.145599365234375, 0.1670989990234375, 0.1885986328125, 0.2100982666015625, 0.231597900390625, 0.2530975341796875, 0.27459716796875, 0.2960968017578125, 0.317596435546875, 0.3390960693359375, 0.360595703125, 0.3820953369140625, 0.403594970703125, 0.4250946044921875, 0.44659423828125, 0.4680938720703125, 0.489593505859375, 0.5110931396484375, 0.5325927734375, 0.5540924072265625, 0.575592041015625, 0.5970916748046875, 0.61859130859375, 0.6400909423828125, 0.661590576171875, 0.6830902099609375, 0.70458984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 102.0, 910.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02921820804476738, -0.01572445034980774, -0.002230694517493248, 0.011263061314821243, 0.024756819009780884, 0.038250576704740524, 0.051744330674409866, 0.0652380883693695, 0.07873184978961945, 0.09222560375928879, 0.10571936517953873, 0.11921311914920807, 0.132706880569458, 0.14620062708854675, 0.1596943885087967, 0.17318814992904663, 0.18668189644813538, 0.20017565786838531, 0.21366940438747406, 0.227163165807724, 0.24065692722797394, 0.2541506886482239, 0.2676444351673126, 0.28113818168640137, 0.2946319580078125, 0.30812570452690125, 0.3216194808483124, 0.3351132273674011, 0.34860697388648987, 0.362100750207901, 0.37559449672698975, 0.3890882730484009, 0.4025820195674896, 0.41607576608657837, 0.4295695424079895, 0.44306328892707825, 0.456557035446167, 0.4700508117675781, 0.48354455828666687, 0.4970383048057556, 0.5105320811271667, 0.5240258574485779, 0.5375195741653442, 0.5510133504867554, 0.5645071268081665, 0.5780008435249329, 0.591494619846344, 0.6049883961677551, 0.6184821128845215, 0.6319758892059326, 0.645469605922699, 0.6589633822441101, 0.6724571585655212, 0.6859508752822876, 0.6994446516036987, 0.7129384279251099, 0.726432204246521, 0.7399259805679321, 0.7534196972846985, 0.7669134736061096, 0.7804072499275208, 0.7939009666442871, 0.8073947429656982, 0.8208885192871094, 0.8343822360038757]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 10.0, 30.0, 25.0, 45.0, 63.0, 75.0, 91.0, 103.0, 95.0, 100.0, 91.0, 74.0, 61.0, 47.0, 35.0, 24.0, 24.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0597648024559021, -0.058217670768499374, -0.05667053908109665, -0.05512341111898422, -0.0535762794315815, -0.05202914774417877, -0.050482019782066345, -0.04893488809466362, -0.047387756407260895, -0.04584062471985817, -0.044293493032455444, -0.04274636507034302, -0.04119923338294029, -0.03965210169553757, -0.03810497373342514, -0.036557842046022415, -0.03501071035861969, -0.033463578671216965, -0.03191644698381424, -0.030369319021701813, -0.028822187334299088, -0.027275055646896362, -0.025727925822138786, -0.02418079599738121, -0.022633664309978485, -0.02108653262257576, -0.019539402797818184, -0.017992272973060608, -0.016445141285657883, -0.014898010529577732, -0.013350879773497581, -0.011803749017417431, -0.01025661826133728, -0.00870948750525713, -0.007162356749176979, -0.0056152259930968285, -0.004068095237016678, -0.0025209644809365273, -0.0009738337248563766, 0.000573297031223774, 0.0021204277873039246, 0.003667558543384075, 0.005214689299464226, 0.006761820055544376, 0.008308950811624527, 0.009856081567704678, 0.011403212323784828, 0.012950343079864979, 0.01449747383594513, 0.016044605523347855, 0.01759173534810543, 0.019138865172863007, 0.020685996860265732, 0.022233128547668457, 0.023780258372426033, 0.02532738819718361, 0.026874519884586334, 0.02842165157198906, 0.029968781396746635, 0.03151591122150421, 0.03306304290890694, 0.03461017459630966, 0.03615730255842209, 0.037704434245824814, 0.03925156593322754]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 7.0, 10.0, 4.0, 6.0, 9.0, 14.0, 19.0, 22.0, 34.0, 25.0, 15.0, 23.0, 25.0, 36.0, 21.0, 28.0, 49.0, 37.0, 45.0, 32.0, 45.0, 30.0, 50.0, 32.0, 42.0, 34.0, 37.0, 29.0, 31.0, 30.0, 27.0, 25.0, 15.0, 22.0, 14.0, 6.0, 15.0, 9.0, 11.0, 9.0, 8.0, 7.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.5458984375, -10.201171875, -9.8564453125, -9.51171875, -9.1669921875, -8.822265625, -8.4775390625, -8.1328125, -7.7880859375, -7.443359375, -7.0986328125, -6.75390625, -6.4091796875, -6.064453125, -5.7197265625, -5.375, -5.0302734375, -4.685546875, -4.3408203125, -3.99609375, -3.6513671875, -3.306640625, -2.9619140625, -2.6171875, -2.2724609375, -1.927734375, -1.5830078125, -1.23828125, -0.8935546875, -0.548828125, -0.2041015625, 0.140625, 0.4853515625, 0.830078125, 1.1748046875, 1.51953125, 1.8642578125, 2.208984375, 2.5537109375, 2.8984375, 3.2431640625, 3.587890625, 3.9326171875, 4.27734375, 4.6220703125, 4.966796875, 5.3115234375, 5.65625, 6.0009765625, 6.345703125, 6.6904296875, 7.03515625, 7.3798828125, 7.724609375, 8.0693359375, 8.4140625, 8.7587890625, 9.103515625, 9.4482421875, 9.79296875, 10.1376953125, 10.482421875, 10.8271484375, 11.171875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 7.0, 9.0, 11.0, 15.0, 35.0, 36.0, 56.0, 56.0, 66.0, 87.0, 128.0, 211.0, 441.0, 795.0, 1727.0, 4423.0, 14056.0, 75831.0, 687454.0, 222577.0, 27996.0, 7366.0, 2621.0, 1088.0, 519.0, 260.0, 195.0, 127.0, 94.0, 49.0, 37.0, 39.0, 22.0, 16.0, 18.0, 12.0, 16.0, 9.0, 12.0, 7.0, 7.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.17041015625, -20.4814453125, -19.79248046875, -19.103515625, -18.41455078125, -17.7255859375, -17.03662109375, -16.34765625, -15.65869140625, -14.9697265625, -14.28076171875, -13.591796875, -12.90283203125, -12.2138671875, -11.52490234375, -10.8359375, -10.14697265625, -9.4580078125, -8.76904296875, -8.080078125, -7.39111328125, -6.7021484375, -6.01318359375, -5.32421875, -4.63525390625, -3.9462890625, -3.25732421875, -2.568359375, -1.87939453125, -1.1904296875, -0.50146484375, 0.1875, 0.87646484375, 1.5654296875, 2.25439453125, 2.943359375, 3.63232421875, 4.3212890625, 5.01025390625, 5.69921875, 6.38818359375, 7.0771484375, 7.76611328125, 8.455078125, 9.14404296875, 9.8330078125, 10.52197265625, 11.2109375, 11.89990234375, 12.5888671875, 13.27783203125, 13.966796875, 14.65576171875, 15.3447265625, 16.03369140625, 16.72265625, 17.41162109375, 18.1005859375, 18.78955078125, 19.478515625, 20.16748046875, 20.8564453125, 21.54541015625, 22.234375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 5.0, 11.0, 7.0, 18.0, 11.0, 17.0, 18.0, 29.0, 24.0, 29.0, 36.0, 40.0, 37.0, 37.0, 47.0, 58.0, 151.0, 1589.0, 346.0, 105.0, 59.0, 53.0, 43.0, 30.0, 37.0, 43.0, 25.0, 31.0, 22.0, 18.0, 17.0, 6.0, 6.0, 6.0, 8.0, 4.0, 7.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -35.255859375, -34.07421875, -32.892578125, -31.7109375, -30.529296875, -29.34765625, -28.166015625, -26.984375, -25.802734375, -24.62109375, -23.439453125, -22.2578125, -21.076171875, -19.89453125, -18.712890625, -17.53125, -16.349609375, -15.16796875, -13.986328125, -12.8046875, -11.623046875, -10.44140625, -9.259765625, -8.078125, -6.896484375, -5.71484375, -4.533203125, -3.3515625, -2.169921875, -0.98828125, 0.193359375, 1.375, 2.556640625, 3.73828125, 4.919921875, 6.1015625, 7.283203125, 8.46484375, 9.646484375, 10.828125, 12.009765625, 13.19140625, 14.373046875, 15.5546875, 16.736328125, 17.91796875, 19.099609375, 20.28125, 21.462890625, 22.64453125, 23.826171875, 25.0078125, 26.189453125, 27.37109375, 28.552734375, 29.734375, 30.916015625, 32.09765625, 33.279296875, 34.4609375, 35.642578125, 36.82421875, 38.005859375, 39.1875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 12.0, 2.0, 5.0, 10.0, 4.0, 10.0, 16.0, 18.0, 26.0, 34.0, 44.0, 41.0, 58.0, 83.0, 137.0, 215.0, 459.0, 1746.0, 43342.0, 3082396.0, 14929.0, 1116.0, 341.0, 191.0, 106.0, 92.0, 57.0, 45.0, 36.0, 26.0, 20.0, 19.0, 11.0, 19.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-91.25, -88.515625, -85.78125, -83.046875, -80.3125, -77.578125, -74.84375, -72.109375, -69.375, -66.640625, -63.90625, -61.171875, -58.4375, -55.703125, -52.96875, -50.234375, -47.5, -44.765625, -42.03125, -39.296875, -36.5625, -33.828125, -31.09375, -28.359375, -25.625, -22.890625, -20.15625, -17.421875, -14.6875, -11.953125, -9.21875, -6.484375, -3.75, -1.015625, 1.71875, 4.453125, 7.1875, 9.921875, 12.65625, 15.390625, 18.125, 20.859375, 23.59375, 26.328125, 29.0625, 31.796875, 34.53125, 37.265625, 40.0, 42.734375, 45.46875, 48.203125, 50.9375, 53.671875, 56.40625, 59.140625, 61.875, 64.609375, 67.34375, 70.078125, 72.8125, 75.546875, 78.28125, 81.015625, 83.75]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 55.0, 164.0, 283.0, 312.0, 149.0, 32.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.134422302246094, -25.317777633666992, -22.50113296508789, -19.684490203857422, -16.86784553527832, -14.051200866699219, -11.23455810546875, -8.417913436889648, -5.601268768310547, -2.7846245765686035, 0.032019615173339844, 2.848663330078125, 5.665307998657227, 8.481952667236328, 11.298595428466797, 14.115240097045898, 16.931884765625, 19.7485294342041, 22.565174102783203, 25.381816864013672, 28.198461532592773, 31.015106201171875, 33.831748962402344, 36.64839172363281, 39.46503829956055, 42.281681060791016, 45.09832763671875, 47.91497039794922, 50.73161315917969, 53.54825973510742, 56.36490249633789, 59.181549072265625, 61.998199462890625, 64.8148422241211, 67.63148498535156, 70.44813537597656, 73.26477813720703, 76.0814208984375, 78.89806365966797, 81.71470642089844, 84.53135681152344, 87.3479995727539, 90.16464233398438, 92.98129272460938, 95.79793548583984, 98.61457824707031, 101.43122100830078, 104.24786376953125, 107.06450653076172, 109.88114929199219, 112.69779205322266, 115.51443481445312, 118.33108520507812, 121.1477279663086, 123.96437072753906, 126.78101348876953, 129.59765625, 132.414306640625, 135.23094177246094, 138.04759216308594, 140.86422729492188, 143.68087768554688, 146.49752807617188, 149.3141632080078, 152.1308135986328]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 8.0, 6.0, 8.0, 8.0, 13.0, 17.0, 17.0, 24.0, 19.0, 23.0, 24.0, 32.0, 30.0, 34.0, 36.0, 44.0, 56.0, 43.0, 37.0, 42.0, 61.0, 36.0, 41.0, 44.0, 37.0, 36.0, 37.0, 30.0, 28.0, 16.0, 22.0, 13.0, 22.0, 11.0, 5.0, 4.0, 8.0, 9.0, 4.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-90.42059326171875, -87.60358428955078, -84.78656768798828, -81.96955871582031, -79.15254211425781, -76.33553314208984, -73.51852416992188, -70.70150756835938, -67.8844985961914, -65.06748962402344, -62.25047302246094, -59.43346405029297, -56.616451263427734, -53.7994384765625, -50.98242950439453, -48.1654167175293, -45.34840393066406, -42.53139114379883, -39.714378356933594, -36.897369384765625, -34.08035659790039, -31.263343811035156, -28.446332931518555, -25.629322052001953, -22.81230926513672, -19.995296478271484, -17.178285598754883, -14.361273765563965, -11.544261932373047, -8.727250099182129, -5.910238265991211, -3.0932273864746094, -0.27622222900390625, 2.5407896041870117, 5.35780143737793, 8.174813270568848, 10.991825103759766, 13.808836936950684, 16.6258487701416, 19.442859649658203, 22.259872436523438, 25.076885223388672, 27.893896102905273, 30.710906982421875, 33.52791976928711, 36.344932556152344, 39.16194152832031, 41.97895431518555, 44.79596710205078, 47.612979888916016, 50.42999267578125, 53.24700164794922, 56.06401443481445, 58.88102722167969, 61.698036193847656, 64.51504516601562, 67.33206176757812, 70.1490707397461, 72.9660873413086, 75.78309631347656, 78.60011291503906, 81.41712188720703, 84.234130859375, 87.0511474609375, 89.86815643310547]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 6.0, 9.0, 8.0, 8.0, 15.0, 13.0, 19.0, 17.0, 24.0, 22.0, 32.0, 26.0, 30.0, 30.0, 38.0, 35.0, 33.0, 37.0, 45.0, 36.0, 42.0, 30.0, 38.0, 38.0, 44.0, 36.0, 32.0, 27.0, 31.0, 26.0, 30.0, 18.0, 24.0, 13.0, 13.0, 13.0, 12.0, 5.0, 10.0, 6.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.8125, -11.454833984375, -11.09716796875, -10.739501953125, -10.3818359375, -10.024169921875, -9.66650390625, -9.308837890625, -8.951171875, -8.593505859375, -8.23583984375, -7.878173828125, -7.5205078125, -7.162841796875, -6.80517578125, -6.447509765625, -6.08984375, -5.732177734375, -5.37451171875, -5.016845703125, -4.6591796875, -4.301513671875, -3.94384765625, -3.586181640625, -3.228515625, -2.870849609375, -2.51318359375, -2.155517578125, -1.7978515625, -1.440185546875, -1.08251953125, -0.724853515625, -0.3671875, -0.009521484375, 0.34814453125, 0.705810546875, 1.0634765625, 1.421142578125, 1.77880859375, 2.136474609375, 2.494140625, 2.851806640625, 3.20947265625, 3.567138671875, 3.9248046875, 4.282470703125, 4.64013671875, 4.997802734375, 5.35546875, 5.713134765625, 6.07080078125, 6.428466796875, 6.7861328125, 7.143798828125, 7.50146484375, 7.859130859375, 8.216796875, 8.574462890625, 8.93212890625, 9.289794921875, 9.6474609375, 10.005126953125, 10.36279296875, 10.720458984375, 11.078125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 11.0, 9.0, 17.0, 12.0, 22.0, 21.0, 45.0, 42.0, 74.0, 111.0, 183.0, 261.0, 539.0, 951.0, 2039.0, 4840.0, 14323.0, 58004.0, 370185.0, 2078485.0, 1411243.0, 199150.0, 36435.0, 10171.0, 3654.0, 1608.0, 773.0, 417.0, 244.0, 121.0, 76.0, 49.0, 46.0, 31.0, 18.0, 9.0, 13.0, 10.0, 10.0, 5.0, 6.0, 4.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.78125, -23.07861328125, -22.3759765625, -21.67333984375, -20.970703125, -20.26806640625, -19.5654296875, -18.86279296875, -18.16015625, -17.45751953125, -16.7548828125, -16.05224609375, -15.349609375, -14.64697265625, -13.9443359375, -13.24169921875, -12.5390625, -11.83642578125, -11.1337890625, -10.43115234375, -9.728515625, -9.02587890625, -8.3232421875, -7.62060546875, -6.91796875, -6.21533203125, -5.5126953125, -4.81005859375, -4.107421875, -3.40478515625, -2.7021484375, -1.99951171875, -1.296875, -0.59423828125, 0.1083984375, 0.81103515625, 1.513671875, 2.21630859375, 2.9189453125, 3.62158203125, 4.32421875, 5.02685546875, 5.7294921875, 6.43212890625, 7.134765625, 7.83740234375, 8.5400390625, 9.24267578125, 9.9453125, 10.64794921875, 11.3505859375, 12.05322265625, 12.755859375, 13.45849609375, 14.1611328125, 14.86376953125, 15.56640625, 16.26904296875, 16.9716796875, 17.67431640625, 18.376953125, 19.07958984375, 19.7822265625, 20.48486328125, 21.1875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 7.0, 9.0, 9.0, 16.0, 24.0, 33.0, 32.0, 43.0, 50.0, 98.0, 103.0, 156.0, 165.0, 245.0, 293.0, 408.0, 441.0, 443.0, 360.0, 278.0, 238.0, 147.0, 123.0, 81.0, 80.0, 48.0, 34.0, 28.0, 27.0, 11.0, 17.0, 8.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.680419921875, -18.12646484375, -17.572509765625, -17.0185546875, -16.464599609375, -15.91064453125, -15.356689453125, -14.802734375, -14.248779296875, -13.69482421875, -13.140869140625, -12.5869140625, -12.032958984375, -11.47900390625, -10.925048828125, -10.37109375, -9.817138671875, -9.26318359375, -8.709228515625, -8.1552734375, -7.601318359375, -7.04736328125, -6.493408203125, -5.939453125, -5.385498046875, -4.83154296875, -4.277587890625, -3.7236328125, -3.169677734375, -2.61572265625, -2.061767578125, -1.5078125, -0.953857421875, -0.39990234375, 0.154052734375, 0.7080078125, 1.261962890625, 1.81591796875, 2.369873046875, 2.923828125, 3.477783203125, 4.03173828125, 4.585693359375, 5.1396484375, 5.693603515625, 6.24755859375, 6.801513671875, 7.35546875, 7.909423828125, 8.46337890625, 9.017333984375, 9.5712890625, 10.125244140625, 10.67919921875, 11.233154296875, 11.787109375, 12.341064453125, 12.89501953125, 13.448974609375, 14.0029296875, 14.556884765625, 15.11083984375, 15.664794921875, 16.21875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 9.0, 14.0, 17.0, 29.0, 22.0, 27.0, 48.0, 56.0, 84.0, 102.0, 126.0, 184.0, 245.0, 453.0, 854.0, 2509.0, 11798.0, 96414.0, 1602714.0, 2322154.0, 135246.0, 15605.0, 3027.0, 997.0, 437.0, 277.0, 191.0, 126.0, 88.0, 87.0, 64.0, 68.0, 34.0, 46.0, 19.0, 18.0, 16.0, 13.0, 11.0, 5.0, 8.0, 6.0, 3.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-43.9375, -42.60888671875, -41.2802734375, -39.95166015625, -38.623046875, -37.29443359375, -35.9658203125, -34.63720703125, -33.30859375, -31.97998046875, -30.6513671875, -29.32275390625, -27.994140625, -26.66552734375, -25.3369140625, -24.00830078125, -22.6796875, -21.35107421875, -20.0224609375, -18.69384765625, -17.365234375, -16.03662109375, -14.7080078125, -13.37939453125, -12.05078125, -10.72216796875, -9.3935546875, -8.06494140625, -6.736328125, -5.40771484375, -4.0791015625, -2.75048828125, -1.421875, -0.09326171875, 1.2353515625, 2.56396484375, 3.892578125, 5.22119140625, 6.5498046875, 7.87841796875, 9.20703125, 10.53564453125, 11.8642578125, 13.19287109375, 14.521484375, 15.85009765625, 17.1787109375, 18.50732421875, 19.8359375, 21.16455078125, 22.4931640625, 23.82177734375, 25.150390625, 26.47900390625, 27.8076171875, 29.13623046875, 30.46484375, 31.79345703125, 33.1220703125, 34.45068359375, 35.779296875, 37.10791015625, 38.4365234375, 39.76513671875, 41.09375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 12.0, 141.0, 470.0, 337.0, 50.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-589.5473022460938, -577.4707641601562, -565.3941650390625, -553.317626953125, -541.2410278320312, -529.1644897460938, -517.087890625, -505.0113525390625, -492.934814453125, -480.8582458496094, -468.78167724609375, -456.70513916015625, -444.6285705566406, -432.552001953125, -420.4754333496094, -408.39886474609375, -396.3222961425781, -384.2457275390625, -372.1691589355469, -360.09259033203125, -348.01605224609375, -335.9394836425781, -323.8629150390625, -311.7863464355469, -299.70977783203125, -287.6332092285156, -275.556640625, -263.4801025390625, -251.40353393554688, -239.32696533203125, -227.25039672851562, -215.173828125, -203.0972900390625, -191.02072143554688, -178.9441680908203, -166.8675994873047, -154.79104614257812, -142.7144775390625, -130.63790893554688, -118.56134796142578, -106.48478698730469, -94.4082260131836, -82.3316650390625, -70.25509643554688, -58.17853546142578, -46.10197448730469, -34.02540588378906, -21.94884490966797, -9.872283935546875, 2.2042789459228516, 14.280841827392578, 26.357406616210938, 38.43396759033203, 50.510528564453125, 62.58709716796875, 74.66365814208984, 86.74021911621094, 98.81678009033203, 110.89334106445312, 122.96990966796875, 135.04647827148438, 147.12303161621094, 159.19960021972656, 171.27615356445312, 183.35272216796875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 7.0, 12.0, 12.0, 13.0, 20.0, 23.0, 19.0, 26.0, 43.0, 36.0, 31.0, 42.0, 41.0, 47.0, 33.0, 49.0, 48.0, 67.0, 36.0, 45.0, 41.0, 37.0, 40.0, 28.0, 30.0, 27.0, 24.0, 20.0, 18.0, 19.0, 11.0, 6.0, 7.0, 7.0, 4.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-81.32589721679688, -79.14510345458984, -76.96430969238281, -74.78352355957031, -72.60272979736328, -70.42193603515625, -68.24114227294922, -66.06034851074219, -63.87955856323242, -61.69876480102539, -59.517974853515625, -57.337181091308594, -55.15638732910156, -52.9755973815918, -50.794803619384766, -48.614013671875, -46.43321990966797, -44.25242614746094, -42.07163619995117, -39.89084243774414, -37.710052490234375, -35.529258728027344, -33.34846496582031, -31.167673110961914, -28.986881256103516, -26.806089401245117, -24.62529754638672, -22.444503784179688, -20.26371192932129, -18.08292007446289, -15.902127265930176, -13.721334457397461, -11.540542602539062, -9.359750747680664, -7.178957939147949, -4.998165607452393, -2.817373275756836, -0.6365814208984375, 1.5442113876342773, 3.725004196166992, 5.905796051025391, 8.086587905883789, 10.267380714416504, 12.448173522949219, 14.628965377807617, 16.809757232666016, 18.990550994873047, 21.171342849731445, 23.352134704589844, 25.532926559448242, 27.71371841430664, 29.894512176513672, 32.07530212402344, 34.25609588623047, 36.4368896484375, 38.61768341064453, 40.7984733581543, 42.97926712036133, 45.160057067871094, 47.340850830078125, 49.521644592285156, 51.70243453979492, 53.88322830200195, 56.06401824951172, 58.24481201171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 7.0, 7.0, 7.0, 11.0, 15.0, 15.0, 14.0, 28.0, 28.0, 19.0, 22.0, 29.0, 34.0, 35.0, 30.0, 42.0, 50.0, 35.0, 42.0, 55.0, 41.0, 39.0, 35.0, 34.0, 40.0, 30.0, 34.0, 26.0, 26.0, 18.0, 17.0, 16.0, 18.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.1953125, -12.8187255859375, -12.442138671875, -12.0655517578125, -11.68896484375, -11.3123779296875, -10.935791015625, -10.5592041015625, -10.1826171875, -9.8060302734375, -9.429443359375, -9.0528564453125, -8.67626953125, -8.2996826171875, -7.923095703125, -7.5465087890625, -7.169921875, -6.7933349609375, -6.416748046875, -6.0401611328125, -5.66357421875, -5.2869873046875, -4.910400390625, -4.5338134765625, -4.1572265625, -3.7806396484375, -3.404052734375, -3.0274658203125, -2.65087890625, -2.2742919921875, -1.897705078125, -1.5211181640625, -1.14453125, -0.7679443359375, -0.391357421875, -0.0147705078125, 0.36181640625, 0.7384033203125, 1.114990234375, 1.4915771484375, 1.8681640625, 2.2447509765625, 2.621337890625, 2.9979248046875, 3.37451171875, 3.7510986328125, 4.127685546875, 4.5042724609375, 4.880859375, 5.2574462890625, 5.634033203125, 6.0106201171875, 6.38720703125, 6.7637939453125, 7.140380859375, 7.5169677734375, 7.8935546875, 8.2701416015625, 8.646728515625, 9.0233154296875, 9.39990234375, 9.7764892578125, 10.153076171875, 10.5296630859375, 10.90625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 10.0, 18.0, 22.0, 39.0, 59.0, 74.0, 125.0, 199.0, 276.0, 436.0, 688.0, 1164.0, 1725.0, 2825.0, 4342.0, 6954.0, 11448.0, 18401.0, 29855.0, 48016.0, 75324.0, 114047.0, 155156.0, 170827.0, 140865.0, 97641.0, 63341.0, 39509.0, 24821.0, 15110.0, 9416.0, 5826.0, 3546.0, 2371.0, 1387.0, 939.0, 597.0, 356.0, 270.0, 183.0, 110.0, 67.0, 50.0, 36.0, 30.0, 14.0, 12.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.8603515625, -0.8337173461914062, -0.8070831298828125, -0.7804489135742188, -0.753814697265625, -0.7271804809570312, -0.7005462646484375, -0.6739120483398438, -0.64727783203125, -0.6206436157226562, -0.5940093994140625, -0.5673751831054688, -0.540740966796875, -0.5141067504882812, -0.4874725341796875, -0.46083831787109375, -0.4342041015625, -0.40756988525390625, -0.3809356689453125, -0.35430145263671875, -0.327667236328125, -0.30103302001953125, -0.2743988037109375, -0.24776458740234375, -0.22113037109375, -0.19449615478515625, -0.1678619384765625, -0.14122772216796875, -0.114593505859375, -0.08795928955078125, -0.0613250732421875, -0.03469085693359375, -0.008056640625, 0.01857757568359375, 0.0452117919921875, 0.07184600830078125, 0.098480224609375, 0.12511444091796875, 0.1517486572265625, 0.17838287353515625, 0.20501708984375, 0.23165130615234375, 0.2582855224609375, 0.28491973876953125, 0.311553955078125, 0.33818817138671875, 0.3648223876953125, 0.39145660400390625, 0.4180908203125, 0.44472503662109375, 0.4713592529296875, 0.49799346923828125, 0.524627685546875, 0.5512619018554688, 0.5778961181640625, 0.6045303344726562, 0.63116455078125, 0.6577987670898438, 0.6844329833984375, 0.7110671997070312, 0.737701416015625, 0.7643356323242188, 0.7909698486328125, 0.8176040649414062, 0.84423828125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 11.0, 7.0, 12.0, 7.0, 26.0, 27.0, 27.0, 17.0, 32.0, 16.0, 28.0, 30.0, 33.0, 37.0, 39.0, 30.0, 31.0, 39.0, 1061.0, 40.0, 35.0, 30.0, 39.0, 28.0, 33.0, 27.0, 31.0, 30.0, 28.0, 25.0, 20.0, 19.0, 14.0, 17.0, 18.0, 17.0, 10.0, 6.0, 5.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.33984375, -7.11376953125, -6.8876953125, -6.66162109375, -6.435546875, -6.20947265625, -5.9833984375, -5.75732421875, -5.53125, -5.30517578125, -5.0791015625, -4.85302734375, -4.626953125, -4.40087890625, -4.1748046875, -3.94873046875, -3.72265625, -3.49658203125, -3.2705078125, -3.04443359375, -2.818359375, -2.59228515625, -2.3662109375, -2.14013671875, -1.9140625, -1.68798828125, -1.4619140625, -1.23583984375, -1.009765625, -0.78369140625, -0.5576171875, -0.33154296875, -0.10546875, 0.12060546875, 0.3466796875, 0.57275390625, 0.798828125, 1.02490234375, 1.2509765625, 1.47705078125, 1.703125, 1.92919921875, 2.1552734375, 2.38134765625, 2.607421875, 2.83349609375, 3.0595703125, 3.28564453125, 3.51171875, 3.73779296875, 3.9638671875, 4.18994140625, 4.416015625, 4.64208984375, 4.8681640625, 5.09423828125, 5.3203125, 5.54638671875, 5.7724609375, 5.99853515625, 6.224609375, 6.45068359375, 6.6767578125, 6.90283203125, 7.12890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 20.0, 38.0, 39.0, 59.0, 120.0, 138.0, 220.0, 318.0, 581.0, 985.0, 1612.0, 2624.0, 4177.0, 6874.0, 10952.0, 18170.0, 28486.0, 45229.0, 69643.0, 103279.0, 139800.0, 1195689.0, 151019.0, 109768.0, 75819.0, 48873.0, 31402.0, 19461.0, 12141.0, 7588.0, 4554.0, 2838.0, 1669.0, 1076.0, 665.0, 437.0, 257.0, 169.0, 100.0, 80.0, 48.0, 34.0, 21.0, 12.0, 8.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5767059326171875, -0.557220458984375, -0.5377349853515625, -0.51824951171875, -0.4987640380859375, -0.479278564453125, -0.4597930908203125, -0.4403076171875, -0.4208221435546875, -0.401336669921875, -0.3818511962890625, -0.36236572265625, -0.3428802490234375, -0.323394775390625, -0.3039093017578125, -0.284423828125, -0.2649383544921875, -0.245452880859375, -0.2259674072265625, -0.20648193359375, -0.1869964599609375, -0.167510986328125, -0.1480255126953125, -0.1285400390625, -0.1090545654296875, -0.089569091796875, -0.0700836181640625, -0.05059814453125, -0.0311126708984375, -0.011627197265625, 0.0078582763671875, 0.02734375, 0.0468292236328125, 0.066314697265625, 0.0858001708984375, 0.10528564453125, 0.1247711181640625, 0.144256591796875, 0.1637420654296875, 0.1832275390625, 0.2027130126953125, 0.222198486328125, 0.2416839599609375, 0.26116943359375, 0.2806549072265625, 0.300140380859375, 0.3196258544921875, 0.339111328125, 0.3585968017578125, 0.378082275390625, 0.3975677490234375, 0.41705322265625, 0.4365386962890625, 0.456024169921875, 0.4755096435546875, 0.4949951171875, 0.5144805908203125, 0.533966064453125, 0.5534515380859375, 0.57293701171875, 0.5924224853515625, 0.611907958984375, 0.6313934326171875, 0.65087890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 9.0, 5.0, 11.0, 12.0, 17.0, 14.0, 25.0, 33.0, 39.0, 39.0, 52.0, 54.0, 61.0, 82.0, 68.0, 76.0, 75.0, 53.0, 52.0, 32.0, 29.0, 24.0, 21.0, 14.0, 16.0, 14.0, 10.0, 5.0, 5.0, 12.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.016021728515625, -0.0155181884765625, -0.0150146484375, -0.0145111083984375, -0.014007568359375, -0.0135040283203125, -0.01300048828125, -0.0124969482421875, -0.011993408203125, -0.0114898681640625, -0.010986328125, -0.0104827880859375, -0.009979248046875, -0.0094757080078125, -0.00897216796875, -0.0084686279296875, -0.007965087890625, -0.0074615478515625, -0.0069580078125, -0.0064544677734375, -0.005950927734375, -0.0054473876953125, -0.00494384765625, -0.0044403076171875, -0.003936767578125, -0.0034332275390625, -0.0029296875, -0.0024261474609375, -0.001922607421875, -0.0014190673828125, -0.00091552734375, -0.0004119873046875, 9.1552734375e-05, 0.0005950927734375, 0.0010986328125, 0.0016021728515625, 0.002105712890625, 0.0026092529296875, 0.00311279296875, 0.0036163330078125, 0.004119873046875, 0.0046234130859375, 0.005126953125, 0.0056304931640625, 0.006134033203125, 0.0066375732421875, 0.00714111328125, 0.0076446533203125, 0.008148193359375, 0.0086517333984375, 0.0091552734375, 0.0096588134765625, 0.010162353515625, 0.0106658935546875, 0.01116943359375, 0.0116729736328125, 0.012176513671875, 0.0126800537109375, 0.01318359375, 0.0136871337890625, 0.014190673828125, 0.0146942138671875, 0.01519775390625, 0.0157012939453125, 0.016204833984375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 4.0, 11.0, 10.0, 12.0, 8.0, 19.0, 24.0, 30.0, 34.0, 50.0, 60.0, 81.0, 148.0, 241.0, 669.0, 14343.0, 985081.0, 45709.0, 1058.0, 307.0, 171.0, 111.0, 88.0, 65.0, 45.0, 31.0, 24.0, 14.0, 20.0, 16.0, 7.0, 5.0, 5.0, 7.0, 7.0, 4.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.341064453125, -0.3306083679199219, -0.32015228271484375, -0.3096961975097656, -0.2992401123046875, -0.2887840270996094, -0.27832794189453125, -0.2678718566894531, -0.257415771484375, -0.24695968627929688, -0.23650360107421875, -0.22604751586914062, -0.2155914306640625, -0.20513534545898438, -0.19467926025390625, -0.18422317504882812, -0.17376708984375, -0.16331100463867188, -0.15285491943359375, -0.14239883422851562, -0.1319427490234375, -0.12148666381835938, -0.11103057861328125, -0.10057449340820312, -0.090118408203125, -0.07966232299804688, -0.06920623779296875, -0.058750152587890625, -0.0482940673828125, -0.037837982177734375, -0.02738189697265625, -0.016925811767578125, -0.0064697265625, 0.003986358642578125, 0.01444244384765625, 0.024898529052734375, 0.0353546142578125, 0.045810699462890625, 0.05626678466796875, 0.06672286987304688, 0.077178955078125, 0.08763504028320312, 0.09809112548828125, 0.10854721069335938, 0.1190032958984375, 0.12945938110351562, 0.13991546630859375, 0.15037155151367188, 0.16082763671875, 0.17128372192382812, 0.18173980712890625, 0.19219589233398438, 0.2026519775390625, 0.21310806274414062, 0.22356414794921875, 0.23402023315429688, 0.244476318359375, 0.2549324035644531, 0.26538848876953125, 0.2758445739746094, 0.2863006591796875, 0.2967567443847656, 0.30721282958984375, 0.3176689147949219, 0.328125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [44.0, 787.0, 184.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007597451563924551, -0.0031124460510909557, 0.0013725594617426395, 0.005857564974576235, 0.010342570021748543, 0.014827575534582138, 0.019312581047415733, 0.023797588422894478, 0.028282592073082924, 0.03276759758591652, 0.037252604961395264, 0.04173760861158371, 0.046222612261772156, 0.0507076196372509, 0.055192627012729645, 0.05967763066291809, 0.06416263431310654, 0.06864763796329498, 0.07313264906406403, 0.07761765271425247, 0.08210265636444092, 0.08658766001462936, 0.09107266366481781, 0.09555767476558685, 0.1000426784157753, 0.10452768206596375, 0.10901269316673279, 0.11349769681692123, 0.11798270046710968, 0.12246770411729813, 0.12695270776748657, 0.13143771886825562, 0.13592272996902466, 0.1404077410697937, 0.14489273726940155, 0.1493777483701706, 0.15386274456977844, 0.15834775567054749, 0.16283276677131653, 0.16731777787208557, 0.17180277407169342, 0.17628778517246246, 0.1807727813720703, 0.18525779247283936, 0.1897428035736084, 0.19422779977321625, 0.1987128108739853, 0.20319780707359314, 0.20768281817436218, 0.21216782927513123, 0.21665282547473907, 0.22113783657550812, 0.22562283277511597, 0.230107843875885, 0.23459285497665405, 0.2390778660774231, 0.24356286227703094, 0.2480478733778, 0.25253286957740784, 0.2570178806781769, 0.2615028917789459, 0.26598790287971497, 0.2704728841781616, 0.27495789527893066, 0.2794429063796997]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 14.0, 17.0, 13.0, 27.0, 24.0, 21.0, 33.0, 34.0, 52.0, 45.0, 38.0, 48.0, 61.0, 60.0, 46.0, 68.0, 58.0, 42.0, 38.0, 43.0, 38.0, 40.0, 25.0, 27.0, 21.0, 21.0, 10.0, 10.0, 7.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.014806628227233887, -0.014411944895982742, -0.014017261564731598, -0.013622578233480453, -0.013227894902229309, -0.012833211570978165, -0.01243852823972702, -0.012043844908475876, -0.011649161577224731, -0.011254478245973587, -0.010859794914722443, -0.010465111583471298, -0.010070428252220154, -0.00967574492096901, -0.009281061589717865, -0.00888637825846672, -0.008491694927215576, -0.008097011595964432, -0.007702328264713287, -0.007307644933462143, -0.0069129616022109985, -0.006518278270959854, -0.00612359493970871, -0.005728911608457565, -0.005334228277206421, -0.0049395449459552765, -0.004544861614704132, -0.004150178283452988, -0.0037554949522018433, -0.003360811620950699, -0.0029661282896995544, -0.00257144495844841, -0.0021767616271972656, -0.0017820782959461212, -0.0013873949646949768, -0.0009927116334438324, -0.000598028302192688, -0.00020334497094154358, 0.00019133836030960083, 0.0005860216915607452, 0.0009807050228118896, 0.001375388354063034, 0.0017700716853141785, 0.002164755016565323, 0.0025594383478164673, 0.0029541216790676117, 0.003348805010318756, 0.0037434883415699005, 0.004138171672821045, 0.004532855004072189, 0.004927538335323334, 0.005322221666574478, 0.0057169049978256226, 0.006111588329076767, 0.006506271660327911, 0.006900954991579056, 0.0072956383228302, 0.007690321654081345, 0.008085004985332489, 0.008479688316583633, 0.008874371647834778, 0.009269054979085922, 0.009663738310337067, 0.010058421641588211, 0.010453104972839355]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 11.0, 15.0, 15.0, 14.0, 28.0, 27.0, 20.0, 22.0, 29.0, 33.0, 36.0, 30.0, 42.0, 49.0, 36.0, 41.0, 56.0, 39.0, 40.0, 36.0, 33.0, 41.0, 30.0, 34.0, 26.0, 26.0, 18.0, 17.0, 16.0, 18.0, 20.0, 12.0, 12.0, 15.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.203125, -12.826416015625, -12.44970703125, -12.072998046875, -11.6962890625, -11.319580078125, -10.94287109375, -10.566162109375, -10.189453125, -9.812744140625, -9.43603515625, -9.059326171875, -8.6826171875, -8.305908203125, -7.92919921875, -7.552490234375, -7.17578125, -6.799072265625, -6.42236328125, -6.045654296875, -5.6689453125, -5.292236328125, -4.91552734375, -4.538818359375, -4.162109375, -3.785400390625, -3.40869140625, -3.031982421875, -2.6552734375, -2.278564453125, -1.90185546875, -1.525146484375, -1.1484375, -0.771728515625, -0.39501953125, -0.018310546875, 0.3583984375, 0.735107421875, 1.11181640625, 1.488525390625, 1.865234375, 2.241943359375, 2.61865234375, 2.995361328125, 3.3720703125, 3.748779296875, 4.12548828125, 4.502197265625, 4.87890625, 5.255615234375, 5.63232421875, 6.009033203125, 6.3857421875, 6.762451171875, 7.13916015625, 7.515869140625, 7.892578125, 8.269287109375, 8.64599609375, 9.022705078125, 9.3994140625, 9.776123046875, 10.15283203125, 10.529541015625, 10.90625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 8.0, 15.0, 14.0, 14.0, 16.0, 29.0, 38.0, 44.0, 60.0, 87.0, 134.0, 147.0, 216.0, 302.0, 442.0, 608.0, 1177.0, 2688.0, 8225.0, 34735.0, 410600.0, 534583.0, 39089.0, 8974.0, 2857.0, 1201.0, 684.0, 391.0, 307.0, 189.0, 163.0, 107.0, 77.0, 72.0, 55.0, 46.0, 37.0, 30.0, 23.0, 11.0, 12.0, 12.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-32.9375, -31.997314453125, -31.05712890625, -30.116943359375, -29.1767578125, -28.236572265625, -27.29638671875, -26.356201171875, -25.416015625, -24.475830078125, -23.53564453125, -22.595458984375, -21.6552734375, -20.715087890625, -19.77490234375, -18.834716796875, -17.89453125, -16.954345703125, -16.01416015625, -15.073974609375, -14.1337890625, -13.193603515625, -12.25341796875, -11.313232421875, -10.373046875, -9.432861328125, -8.49267578125, -7.552490234375, -6.6123046875, -5.672119140625, -4.73193359375, -3.791748046875, -2.8515625, -1.911376953125, -0.97119140625, -0.031005859375, 0.9091796875, 1.849365234375, 2.78955078125, 3.729736328125, 4.669921875, 5.610107421875, 6.55029296875, 7.490478515625, 8.4306640625, 9.370849609375, 10.31103515625, 11.251220703125, 12.19140625, 13.131591796875, 14.07177734375, 15.011962890625, 15.9521484375, 16.892333984375, 17.83251953125, 18.772705078125, 19.712890625, 20.653076171875, 21.59326171875, 22.533447265625, 23.4736328125, 24.413818359375, 25.35400390625, 26.294189453125, 27.234375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 3.0, 8.0, 12.0, 10.0, 16.0, 18.0, 15.0, 19.0, 33.0, 18.0, 31.0, 45.0, 37.0, 37.0, 36.0, 61.0, 75.0, 285.0, 1661.0, 137.0, 78.0, 57.0, 34.0, 51.0, 36.0, 34.0, 28.0, 20.0, 32.0, 11.0, 14.0, 11.0, 15.0, 16.0, 9.0, 7.0, 7.0, 5.0, 0.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-39.40625, -38.319091796875, -37.23193359375, -36.144775390625, -35.0576171875, -33.970458984375, -32.88330078125, -31.796142578125, -30.708984375, -29.621826171875, -28.53466796875, -27.447509765625, -26.3603515625, -25.273193359375, -24.18603515625, -23.098876953125, -22.01171875, -20.924560546875, -19.83740234375, -18.750244140625, -17.6630859375, -16.575927734375, -15.48876953125, -14.401611328125, -13.314453125, -12.227294921875, -11.14013671875, -10.052978515625, -8.9658203125, -7.878662109375, -6.79150390625, -5.704345703125, -4.6171875, -3.530029296875, -2.44287109375, -1.355712890625, -0.2685546875, 0.818603515625, 1.90576171875, 2.992919921875, 4.080078125, 5.167236328125, 6.25439453125, 7.341552734375, 8.4287109375, 9.515869140625, 10.60302734375, 11.690185546875, 12.77734375, 13.864501953125, 14.95166015625, 16.038818359375, 17.1259765625, 18.213134765625, 19.30029296875, 20.387451171875, 21.474609375, 22.561767578125, 23.64892578125, 24.736083984375, 25.8232421875, 26.910400390625, 27.99755859375, 29.084716796875, 30.171875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 7.0, 8.0, 4.0, 10.0, 16.0, 15.0, 14.0, 18.0, 15.0, 42.0, 24.0, 35.0, 51.0, 77.0, 102.0, 149.0, 314.0, 956.0, 22321.0, 3098405.0, 21296.0, 949.0, 295.0, 132.0, 92.0, 67.0, 46.0, 43.0, 37.0, 32.0, 16.0, 20.0, 22.0, 16.0, 8.0, 8.0, 7.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.1875, -79.1982421875, -76.208984375, -73.2197265625, -70.23046875, -67.2412109375, -64.251953125, -61.2626953125, -58.2734375, -55.2841796875, -52.294921875, -49.3056640625, -46.31640625, -43.3271484375, -40.337890625, -37.3486328125, -34.359375, -31.3701171875, -28.380859375, -25.3916015625, -22.40234375, -19.4130859375, -16.423828125, -13.4345703125, -10.4453125, -7.4560546875, -4.466796875, -1.4775390625, 1.51171875, 4.5009765625, 7.490234375, 10.4794921875, 13.46875, 16.4580078125, 19.447265625, 22.4365234375, 25.42578125, 28.4150390625, 31.404296875, 34.3935546875, 37.3828125, 40.3720703125, 43.361328125, 46.3505859375, 49.33984375, 52.3291015625, 55.318359375, 58.3076171875, 61.296875, 64.2861328125, 67.275390625, 70.2646484375, 73.25390625, 76.2431640625, 79.232421875, 82.2216796875, 85.2109375, 88.2001953125, 91.189453125, 94.1787109375, 97.16796875, 100.1572265625, 103.146484375, 106.1357421875, 109.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 23.0, 354.0, 555.0, 80.0, 6.0], "bins": [-367.01678466796875, -361.0179443359375, -355.01910400390625, -349.0202331542969, -343.0213928222656, -337.0225524902344, -331.0237121582031, -325.0248718261719, -319.0260009765625, -313.02716064453125, -307.0283203125, -301.0294494628906, -295.0306091308594, -289.0317687988281, -283.0329284667969, -277.0340881347656, -271.0352478027344, -265.0364074707031, -259.0375671386719, -253.03871154785156, -247.03985595703125, -241.041015625, -235.04217529296875, -229.04331970214844, -223.04446411132812, -217.04562377929688, -211.04676818847656, -205.0479278564453, -199.049072265625, -193.05023193359375, -187.0513916015625, -181.0525360107422, -175.0537109375, -169.05487060546875, -163.05601501464844, -157.0571746826172, -151.05831909179688, -145.05947875976562, -139.06063842773438, -133.06178283691406, -127.06293487548828, -121.0640869140625, -115.06523895263672, -109.06639099121094, -103.06755065917969, -97.0687026977539, -91.06985473632812, -85.07101440429688, -79.07215881347656, -73.07331085205078, -67.074462890625, -61.075618743896484, -55.07677459716797, -49.07792663574219, -43.079078674316406, -37.08023452758789, -31.081388473510742, -25.082542419433594, -19.083694458007812, -13.084848403930664, -7.086002349853516, -1.0871562957763672, 4.911691665649414, 10.91053581237793, 16.90938377380371]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 7.0, 5.0, 15.0, 4.0, 7.0, 8.0, 13.0, 24.0, 26.0, 30.0, 29.0, 31.0, 35.0, 36.0, 50.0, 30.0, 45.0, 39.0, 32.0, 54.0, 57.0, 38.0, 30.0, 37.0, 34.0, 36.0, 26.0, 29.0, 27.0, 32.0, 28.0, 24.0, 19.0, 12.0, 14.0, 6.0, 7.0, 7.0, 8.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.04960632324219, -78.2597427368164, -75.46987915039062, -72.68001556396484, -69.89015197753906, -67.10028839111328, -64.3104248046875, -61.520565032958984, -58.7307014465332, -55.94083786010742, -53.15097427368164, -50.361114501953125, -47.571250915527344, -44.78138732910156, -41.99152374267578, -39.20166015625, -36.41179656982422, -33.62193298339844, -30.832069396972656, -28.042207717895508, -25.252344131469727, -22.462480545043945, -19.672618865966797, -16.882755279541016, -14.092891693115234, -11.303028106689453, -8.513165473937988, -5.723302841186523, -2.933439254760742, -0.14357566833496094, 2.6462860107421875, 5.436149597167969, 8.22601318359375, 11.015876770019531, 13.805739402770996, 16.59560203552246, 19.385465621948242, 22.175329208374023, 24.965190887451172, 27.755054473876953, 30.544918060302734, 33.334781646728516, 36.1246452331543, 38.91450500488281, 41.704368591308594, 44.494232177734375, 47.284095764160156, 50.07395935058594, 52.86382293701172, 55.6536865234375, 58.44355010986328, 61.23341369628906, 64.02327728271484, 66.81314086914062, 69.60299682617188, 72.39286804199219, 75.18272399902344, 77.97258758544922, 80.762451171875, 83.55231475830078, 86.34217834472656, 89.13204193115234, 91.92190551757812, 94.71176147460938, 97.50163269042969]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 11.0, 7.0, 6.0, 18.0, 12.0, 21.0, 21.0, 19.0, 20.0, 25.0, 23.0, 29.0, 29.0, 45.0, 46.0, 39.0, 33.0, 53.0, 33.0, 43.0, 45.0, 46.0, 35.0, 37.0, 30.0, 35.0, 29.0, 29.0, 19.0, 20.0, 20.0, 20.0, 13.0, 16.0, 10.0, 7.0, 14.0, 12.0, 6.0, 1.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-13.71875, -13.333740234375, -12.94873046875, -12.563720703125, -12.1787109375, -11.793701171875, -11.40869140625, -11.023681640625, -10.638671875, -10.253662109375, -9.86865234375, -9.483642578125, -9.0986328125, -8.713623046875, -8.32861328125, -7.943603515625, -7.55859375, -7.173583984375, -6.78857421875, -6.403564453125, -6.0185546875, -5.633544921875, -5.24853515625, -4.863525390625, -4.478515625, -4.093505859375, -3.70849609375, -3.323486328125, -2.9384765625, -2.553466796875, -2.16845703125, -1.783447265625, -1.3984375, -1.013427734375, -0.62841796875, -0.243408203125, 0.1416015625, 0.526611328125, 0.91162109375, 1.296630859375, 1.681640625, 2.066650390625, 2.45166015625, 2.836669921875, 3.2216796875, 3.606689453125, 3.99169921875, 4.376708984375, 4.76171875, 5.146728515625, 5.53173828125, 5.916748046875, 6.3017578125, 6.686767578125, 7.07177734375, 7.456787109375, 7.841796875, 8.226806640625, 8.61181640625, 8.996826171875, 9.3818359375, 9.766845703125, 10.15185546875, 10.536865234375, 10.921875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 17.0, 18.0, 17.0, 18.0, 22.0, 42.0, 47.0, 80.0, 96.0, 124.0, 197.0, 326.0, 448.0, 765.0, 1243.0, 2285.0, 4802.0, 10500.0, 28105.0, 93399.0, 406766.0, 1473039.0, 1561323.0, 450829.0, 106752.0, 30732.0, 11321.0, 4928.0, 2471.0, 1315.0, 783.0, 461.0, 313.0, 205.0, 119.0, 97.0, 52.0, 54.0, 29.0, 23.0, 21.0, 19.0, 20.0, 14.0, 4.0, 12.0, 6.0, 5.0, 1.0, 4.0, 3.0], "bins": [-17.890625, -17.3800048828125, -16.869384765625, -16.3587646484375, -15.84814453125, -15.3375244140625, -14.826904296875, -14.3162841796875, -13.8056640625, -13.2950439453125, -12.784423828125, -12.2738037109375, -11.76318359375, -11.2525634765625, -10.741943359375, -10.2313232421875, -9.720703125, -9.2100830078125, -8.699462890625, -8.1888427734375, -7.67822265625, -7.1676025390625, -6.656982421875, -6.1463623046875, -5.6357421875, -5.1251220703125, -4.614501953125, -4.1038818359375, -3.59326171875, -3.0826416015625, -2.572021484375, -2.0614013671875, -1.55078125, -1.0401611328125, -0.529541015625, -0.0189208984375, 0.49169921875, 1.0023193359375, 1.512939453125, 2.0235595703125, 2.5341796875, 3.0447998046875, 3.555419921875, 4.0660400390625, 4.57666015625, 5.0872802734375, 5.597900390625, 6.1085205078125, 6.619140625, 7.1297607421875, 7.640380859375, 8.1510009765625, 8.66162109375, 9.1722412109375, 9.682861328125, 10.1934814453125, 10.7041015625, 11.2147216796875, 11.725341796875, 12.2359619140625, 12.74658203125, 13.2572021484375, 13.767822265625, 14.2784423828125, 14.7890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 6.0, 18.0, 24.0, 24.0, 47.0, 59.0, 67.0, 85.0, 115.0, 132.0, 201.0, 248.0, 353.0, 399.0, 426.0, 378.0, 328.0, 277.0, 209.0, 156.0, 130.0, 86.0, 56.0, 54.0, 38.0, 33.0, 30.0, 13.0, 19.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.265625, -11.744140625, -11.22265625, -10.701171875, -10.1796875, -9.658203125, -9.13671875, -8.615234375, -8.09375, -7.572265625, -7.05078125, -6.529296875, -6.0078125, -5.486328125, -4.96484375, -4.443359375, -3.921875, -3.400390625, -2.87890625, -2.357421875, -1.8359375, -1.314453125, -0.79296875, -0.271484375, 0.25, 0.771484375, 1.29296875, 1.814453125, 2.3359375, 2.857421875, 3.37890625, 3.900390625, 4.421875, 4.943359375, 5.46484375, 5.986328125, 6.5078125, 7.029296875, 7.55078125, 8.072265625, 8.59375, 9.115234375, 9.63671875, 10.158203125, 10.6796875, 11.201171875, 11.72265625, 12.244140625, 12.765625, 13.287109375, 13.80859375, 14.330078125, 14.8515625, 15.373046875, 15.89453125, 16.416015625, 16.9375, 17.458984375, 17.98046875, 18.501953125, 19.0234375, 19.544921875, 20.06640625, 20.587890625, 21.109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 15.0, 20.0, 29.0, 34.0, 35.0, 53.0, 82.0, 101.0, 151.0, 239.0, 403.0, 805.0, 2849.0, 19451.0, 296060.0, 3511682.0, 335701.0, 21488.0, 2987.0, 881.0, 398.0, 220.0, 181.0, 110.0, 76.0, 67.0, 36.0, 29.0, 16.0, 19.0, 10.0, 12.0, 8.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-52.0, -50.40087890625, -48.8017578125, -47.20263671875, -45.603515625, -44.00439453125, -42.4052734375, -40.80615234375, -39.20703125, -37.60791015625, -36.0087890625, -34.40966796875, -32.810546875, -31.21142578125, -29.6123046875, -28.01318359375, -26.4140625, -24.81494140625, -23.2158203125, -21.61669921875, -20.017578125, -18.41845703125, -16.8193359375, -15.22021484375, -13.62109375, -12.02197265625, -10.4228515625, -8.82373046875, -7.224609375, -5.62548828125, -4.0263671875, -2.42724609375, -0.828125, 0.77099609375, 2.3701171875, 3.96923828125, 5.568359375, 7.16748046875, 8.7666015625, 10.36572265625, 11.96484375, 13.56396484375, 15.1630859375, 16.76220703125, 18.361328125, 19.96044921875, 21.5595703125, 23.15869140625, 24.7578125, 26.35693359375, 27.9560546875, 29.55517578125, 31.154296875, 32.75341796875, 34.3525390625, 35.95166015625, 37.55078125, 39.14990234375, 40.7490234375, 42.34814453125, 43.947265625, 45.54638671875, 47.1455078125, 48.74462890625, 50.34375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 20.0, 235.0, 554.0, 187.0, 15.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-687.9711303710938, -675.7628173828125, -663.5545043945312, -651.34619140625, -639.1378784179688, -626.9295654296875, -614.7212524414062, -602.512939453125, -590.3046264648438, -578.0963134765625, -565.8880004882812, -553.6796875, -541.4713745117188, -529.2630615234375, -517.0547485351562, -504.846435546875, -492.63812255859375, -480.4298095703125, -468.22149658203125, -456.01318359375, -443.80487060546875, -431.5965576171875, -419.38824462890625, -407.179931640625, -394.9715881347656, -382.7632751464844, -370.5549621582031, -358.3466491699219, -346.1383361816406, -333.9300231933594, -321.7217102050781, -309.5133972167969, -297.3050537109375, -285.09674072265625, -272.888427734375, -260.68011474609375, -248.4718017578125, -236.26348876953125, -224.05517578125, -211.84686279296875, -199.6385498046875, -187.43023681640625, -175.221923828125, -163.01361083984375, -150.8052978515625, -138.59698486328125, -126.38866424560547, -114.18035125732422, -101.97203826904297, -89.76372528076172, -77.55541229248047, -65.34709167480469, -53.1387825012207, -40.93046951293945, -28.722152709960938, -16.513839721679688, -4.3055267333984375, 7.902787208557129, 20.111101150512695, 32.31941604614258, 44.52772903442383, 56.73604202270508, 68.9443588256836, 81.15267181396484, 93.3609848022461]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 7.0, 5.0, 14.0, 11.0, 6.0, 17.0, 11.0, 14.0, 15.0, 15.0, 25.0, 17.0, 41.0, 24.0, 36.0, 31.0, 34.0, 34.0, 42.0, 43.0, 38.0, 29.0, 42.0, 40.0, 39.0, 30.0, 44.0, 35.0, 32.0, 30.0, 19.0, 27.0, 24.0, 12.0, 14.0, 10.0, 21.0, 11.0, 14.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-61.10502624511719, -59.18751525878906, -57.27000045776367, -55.35248947143555, -53.434974670410156, -51.51746368408203, -49.599952697753906, -47.682437896728516, -45.764923095703125, -43.847412109375, -41.92989730834961, -40.012386322021484, -38.094871520996094, -36.17736053466797, -34.259849548339844, -32.34233474731445, -30.424823760986328, -28.50731086730957, -26.589797973632812, -24.672286987304688, -22.754772186279297, -20.837261199951172, -18.919748306274414, -17.002235412597656, -15.084722518920898, -13.16720962524414, -11.249696731567383, -9.332184791564941, -7.414671897888184, -5.497159004211426, -3.5796470642089844, -1.6621341705322266, 0.25537872314453125, 2.17289137840271, 4.090404033660889, 6.007916450500488, 7.925429344177246, 9.842942237854004, 11.760454177856445, 13.677967071533203, 15.595479965209961, 17.51299285888672, 19.430505752563477, 21.348018646240234, 23.26552963256836, 25.18304443359375, 27.100555419921875, 29.018068313598633, 30.93558120727539, 32.853092193603516, 34.770606994628906, 36.68811798095703, 38.60563278198242, 40.52314376831055, 42.44065856933594, 44.35816955566406, 46.27568054199219, 48.19319152832031, 50.1107063293457, 52.02821731567383, 53.94573211669922, 55.863243103027344, 57.78075408935547, 59.69826889038086, 61.61578369140625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 0.0, 7.0, 5.0, 6.0, 11.0, 12.0, 12.0, 15.0, 19.0, 18.0, 33.0, 18.0, 23.0, 30.0, 32.0, 44.0, 32.0, 46.0, 36.0, 39.0, 52.0, 48.0, 31.0, 42.0, 36.0, 29.0, 39.0, 33.0, 26.0, 23.0, 32.0, 24.0, 26.0, 20.0, 19.0, 19.0, 18.0, 17.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.7120361328125, -11.314697265625, -10.9173583984375, -10.52001953125, -10.1226806640625, -9.725341796875, -9.3280029296875, -8.9306640625, -8.5333251953125, -8.135986328125, -7.7386474609375, -7.34130859375, -6.9439697265625, -6.546630859375, -6.1492919921875, -5.751953125, -5.3546142578125, -4.957275390625, -4.5599365234375, -4.16259765625, -3.7652587890625, -3.367919921875, -2.9705810546875, -2.5732421875, -2.1759033203125, -1.778564453125, -1.3812255859375, -0.98388671875, -0.5865478515625, -0.189208984375, 0.2081298828125, 0.60546875, 1.0028076171875, 1.400146484375, 1.7974853515625, 2.19482421875, 2.5921630859375, 2.989501953125, 3.3868408203125, 3.7841796875, 4.1815185546875, 4.578857421875, 4.9761962890625, 5.37353515625, 5.7708740234375, 6.168212890625, 6.5655517578125, 6.962890625, 7.3602294921875, 7.757568359375, 8.1549072265625, 8.55224609375, 8.9495849609375, 9.346923828125, 9.7442626953125, 10.1416015625, 10.5389404296875, 10.936279296875, 11.3336181640625, 11.73095703125, 12.1282958984375, 12.525634765625, 12.9229736328125, 13.3203125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 20.0, 15.0, 32.0, 59.0, 73.0, 113.0, 151.0, 213.0, 329.0, 464.0, 667.0, 1016.0, 1528.0, 2156.0, 3040.0, 4775.0, 6824.0, 10245.0, 15372.0, 23140.0, 34889.0, 51994.0, 76524.0, 106587.0, 136150.0, 147000.0, 126619.0, 95173.0, 66710.0, 45156.0, 29931.0, 20370.0, 13392.0, 9096.0, 6021.0, 3972.0, 2743.0, 1928.0, 1232.0, 860.0, 621.0, 437.0, 306.0, 223.0, 136.0, 85.0, 55.0, 48.0, 24.0, 13.0, 9.0, 2.0, 5.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.7548828125, -0.7315292358398438, -0.7081756591796875, -0.6848220825195312, -0.661468505859375, -0.6381149291992188, -0.6147613525390625, -0.5914077758789062, -0.56805419921875, -0.5447006225585938, -0.5213470458984375, -0.49799346923828125, -0.474639892578125, -0.45128631591796875, -0.4279327392578125, -0.40457916259765625, -0.3812255859375, -0.35787200927734375, -0.3345184326171875, -0.31116485595703125, -0.287811279296875, -0.26445770263671875, -0.2411041259765625, -0.21775054931640625, -0.19439697265625, -0.17104339599609375, -0.1476898193359375, -0.12433624267578125, -0.100982666015625, -0.07762908935546875, -0.0542755126953125, -0.03092193603515625, -0.007568359375, 0.01578521728515625, 0.0391387939453125, 0.06249237060546875, 0.085845947265625, 0.10919952392578125, 0.1325531005859375, 0.15590667724609375, 0.17926025390625, 0.20261383056640625, 0.2259674072265625, 0.24932098388671875, 0.272674560546875, 0.29602813720703125, 0.3193817138671875, 0.34273529052734375, 0.3660888671875, 0.38944244384765625, 0.4127960205078125, 0.43614959716796875, 0.459503173828125, 0.48285675048828125, 0.5062103271484375, 0.5295639038085938, 0.55291748046875, 0.5762710571289062, 0.5996246337890625, 0.6229782104492188, 0.646331787109375, 0.6696853637695312, 0.6930389404296875, 0.7163925170898438, 0.73974609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 2.0, 8.0, 6.0, 11.0, 11.0, 12.0, 17.0, 24.0, 21.0, 29.0, 36.0, 35.0, 27.0, 30.0, 27.0, 41.0, 44.0, 39.0, 38.0, 1075.0, 41.0, 38.0, 57.0, 33.0, 36.0, 20.0, 45.0, 23.0, 30.0, 27.0, 23.0, 22.0, 23.0, 8.0, 17.0, 5.0, 4.0, 8.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.53125, -8.269775390625, -8.00830078125, -7.746826171875, -7.4853515625, -7.223876953125, -6.96240234375, -6.700927734375, -6.439453125, -6.177978515625, -5.91650390625, -5.655029296875, -5.3935546875, -5.132080078125, -4.87060546875, -4.609130859375, -4.34765625, -4.086181640625, -3.82470703125, -3.563232421875, -3.3017578125, -3.040283203125, -2.77880859375, -2.517333984375, -2.255859375, -1.994384765625, -1.73291015625, -1.471435546875, -1.2099609375, -0.948486328125, -0.68701171875, -0.425537109375, -0.1640625, 0.097412109375, 0.35888671875, 0.620361328125, 0.8818359375, 1.143310546875, 1.40478515625, 1.666259765625, 1.927734375, 2.189208984375, 2.45068359375, 2.712158203125, 2.9736328125, 3.235107421875, 3.49658203125, 3.758056640625, 4.01953125, 4.281005859375, 4.54248046875, 4.803955078125, 5.0654296875, 5.326904296875, 5.58837890625, 5.849853515625, 6.111328125, 6.372802734375, 6.63427734375, 6.895751953125, 7.1572265625, 7.418701171875, 7.68017578125, 7.941650390625, 8.203125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 11.0, 18.0, 18.0, 42.0, 42.0, 64.0, 120.0, 189.0, 273.0, 415.0, 708.0, 1165.0, 1905.0, 3087.0, 5387.0, 8808.0, 15093.0, 25300.0, 42376.0, 69904.0, 108399.0, 159896.0, 1205436.0, 161385.0, 109472.0, 70650.0, 43246.0, 25881.0, 15203.0, 8982.0, 5373.0, 3277.0, 1952.0, 1189.0, 644.0, 422.0, 302.0, 165.0, 111.0, 72.0, 48.0, 27.0, 26.0, 15.0, 7.0, 7.0, 1.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.70556640625, -0.6831741333007812, -0.6607818603515625, -0.6383895874023438, -0.615997314453125, -0.5936050415039062, -0.5712127685546875, -0.5488204956054688, -0.52642822265625, -0.5040359497070312, -0.4816436767578125, -0.45925140380859375, -0.436859130859375, -0.41446685791015625, -0.3920745849609375, -0.36968231201171875, -0.3472900390625, -0.32489776611328125, -0.3025054931640625, -0.28011322021484375, -0.257720947265625, -0.23532867431640625, -0.2129364013671875, -0.19054412841796875, -0.16815185546875, -0.14575958251953125, -0.1233673095703125, -0.10097503662109375, -0.078582763671875, -0.05619049072265625, -0.0337982177734375, -0.01140594482421875, 0.010986328125, 0.03337860107421875, 0.0557708740234375, 0.07816314697265625, 0.100555419921875, 0.12294769287109375, 0.1453399658203125, 0.16773223876953125, 0.19012451171875, 0.21251678466796875, 0.2349090576171875, 0.25730133056640625, 0.279693603515625, 0.30208587646484375, 0.3244781494140625, 0.34687042236328125, 0.3692626953125, 0.39165496826171875, 0.4140472412109375, 0.43643951416015625, 0.458831787109375, 0.48122406005859375, 0.5036163330078125, 0.5260086059570312, 0.54840087890625, 0.5707931518554688, 0.5931854248046875, 0.6155776977539062, 0.637969970703125, 0.6603622436523438, 0.6827545166015625, 0.7051467895507812, 0.7275390625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 8.0, 3.0, 10.0, 3.0, 5.0, 5.0, 8.0, 6.0, 10.0, 10.0, 9.0, 15.0, 23.0, 20.0, 26.0, 26.0, 34.0, 44.0, 38.0, 57.0, 74.0, 79.0, 76.0, 65.0, 53.0, 42.0, 32.0, 25.0, 26.0, 28.0, 18.0, 15.0, 20.0, 11.0, 16.0, 14.0, 6.0, 8.0, 11.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0266265869140625, -0.025838851928710938, -0.025051116943359375, -0.024263381958007812, -0.02347564697265625, -0.022687911987304688, -0.021900177001953125, -0.021112442016601562, -0.02032470703125, -0.019536972045898438, -0.018749237060546875, -0.017961502075195312, -0.01717376708984375, -0.016386032104492188, -0.015598297119140625, -0.014810562133789062, -0.0140228271484375, -0.013235092163085938, -0.012447357177734375, -0.011659622192382812, -0.01087188720703125, -0.010084152221679688, -0.009296417236328125, -0.008508682250976562, -0.007720947265625, -0.0069332122802734375, -0.006145477294921875, -0.0053577423095703125, -0.00457000732421875, -0.0037822723388671875, -0.002994537353515625, -0.0022068023681640625, -0.0014190673828125, -0.0006313323974609375, 0.000156402587890625, 0.0009441375732421875, 0.00173187255859375, 0.0025196075439453125, 0.003307342529296875, 0.0040950775146484375, 0.0048828125, 0.0056705474853515625, 0.006458282470703125, 0.0072460174560546875, 0.00803375244140625, 0.008821487426757812, 0.009609222412109375, 0.010396957397460938, 0.0111846923828125, 0.011972427368164062, 0.012760162353515625, 0.013547897338867188, 0.01433563232421875, 0.015123367309570312, 0.015911102294921875, 0.016698837280273438, 0.017486572265625, 0.018274307250976562, 0.019062042236328125, 0.019849777221679688, 0.02063751220703125, 0.021425247192382812, 0.022212982177734375, 0.023000717163085938, 0.0237884521484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 8.0, 10.0, 9.0, 16.0, 10.0, 16.0, 31.0, 20.0, 24.0, 30.0, 39.0, 64.0, 70.0, 101.0, 127.0, 191.0, 312.0, 588.0, 5432.0, 1000605.0, 38767.0, 834.0, 387.0, 210.0, 167.0, 115.0, 81.0, 44.0, 42.0, 40.0, 20.0, 21.0, 17.0, 8.0, 16.0, 20.0, 9.0, 8.0, 12.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468505859375, -0.4527168273925781, -0.43692779541015625, -0.4211387634277344, -0.4053497314453125, -0.3895606994628906, -0.37377166748046875, -0.3579826354980469, -0.342193603515625, -0.3264045715332031, -0.31061553955078125, -0.2948265075683594, -0.2790374755859375, -0.2632484436035156, -0.24745941162109375, -0.23167037963867188, -0.21588134765625, -0.20009231567382812, -0.18430328369140625, -0.16851425170898438, -0.1527252197265625, -0.13693618774414062, -0.12114715576171875, -0.10535812377929688, -0.089569091796875, -0.07378005981445312, -0.05799102783203125, -0.042201995849609375, -0.0264129638671875, -0.010623931884765625, 0.00516510009765625, 0.020954132080078125, 0.0367431640625, 0.052532196044921875, 0.06832122802734375, 0.08411026000976562, 0.0998992919921875, 0.11568832397460938, 0.13147735595703125, 0.14726638793945312, 0.163055419921875, 0.17884445190429688, 0.19463348388671875, 0.21042251586914062, 0.2262115478515625, 0.24200057983398438, 0.25778961181640625, 0.2735786437988281, 0.28936767578125, 0.3051567077636719, 0.32094573974609375, 0.3367347717285156, 0.3525238037109375, 0.3683128356933594, 0.38410186767578125, 0.3998908996582031, 0.415679931640625, 0.4314689636230469, 0.44725799560546875, 0.4630470275878906, 0.4788360595703125, 0.4946250915527344, 0.5104141235351562, 0.5262031555175781, 0.5419921875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [327.0, 690.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014319967478513718, -0.0008359970524907112, 0.012647973373532295, 0.026131942868232727, 0.03961591422557831, 0.05309988185763359, 0.06658385694026947, 0.08006782829761505, 0.09355179965496063, 0.10703577101230621, 0.1205197423696518, 0.13400371372699738, 0.14748768508434296, 0.16097164154052734, 0.17445561289787292, 0.1879395842552185, 0.2014235556125641, 0.21490752696990967, 0.22839149832725525, 0.24187546968460083, 0.2553594410419464, 0.268843412399292, 0.2823273837566376, 0.29581135511398315, 0.30929532647132874, 0.3227792978286743, 0.3362632691860199, 0.3497472405433655, 0.36323121190071106, 0.37671518325805664, 0.3901991546154022, 0.4036831259727478, 0.4171670973300934, 0.43065106868743896, 0.44413504004478455, 0.4576190114021301, 0.4711029827594757, 0.4845869541168213, 0.49807092547416687, 0.5115548968315125, 0.5250388383865356, 0.5385227799415588, 0.5520067811012268, 0.56549072265625, 0.578974723815918, 0.5924586653709412, 0.6059426665306091, 0.6194266080856323, 0.6329106092453003, 0.6463945508003235, 0.6598785519599915, 0.6733624935150146, 0.6868464946746826, 0.7003304362297058, 0.7138144373893738, 0.727298378944397, 0.7407823801040649, 0.7542663216590881, 0.7677503228187561, 0.7812342643737793, 0.7947182655334473, 0.8082022070884705, 0.8216862082481384, 0.8351701498031616, 0.8486541509628296]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 9.0, 18.0, 22.0, 25.0, 37.0, 42.0, 53.0, 69.0, 79.0, 86.0, 94.0, 88.0, 60.0, 70.0, 60.0, 47.0, 39.0, 34.0, 21.0, 21.0, 12.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.039733052253723145, -0.038698434829711914, -0.037663817405700684, -0.036629196256399155, -0.035594578832387924, -0.034559961408376694, -0.033525340259075165, -0.032490722835063934, -0.031456105411052704, -0.030421487987041473, -0.029386868700385094, -0.028352249413728714, -0.027317631989717484, -0.026283014565706253, -0.025248395279049873, -0.024213775992393494, -0.023179158568382263, -0.022144541144371033, -0.021109921857714653, -0.020075302571058273, -0.019040685147047043, -0.018006067723035812, -0.016971448436379433, -0.015936829149723053, -0.014902211725711823, -0.013867593370378017, -0.012832975015044212, -0.011798356659710407, -0.010763738304376602, -0.009729119949042797, -0.008694501593708992, -0.007659883238375187, -0.006625264883041382, -0.005590646527707577, -0.004556028172373772, -0.0035214098170399666, -0.0024867914617061615, -0.0014521731063723564, -0.00041755475103855133, 0.0006170636042952538, 0.0016516819596290588, 0.002686300314962864, 0.003720918670296669, 0.004755537025630474, 0.005790155380964279, 0.006824773736298084, 0.00785939209163189, 0.008894010446965694, 0.0099286288022995, 0.010963247157633305, 0.01199786551296711, 0.013032483868300915, 0.01406710222363472, 0.015101720578968525, 0.01613633893430233, 0.01717095822095871, 0.01820557564496994, 0.01924019306898117, 0.02027481235563755, 0.02130943164229393, 0.02234404906630516, 0.02337866649031639, 0.02441328577697277, 0.02544790506362915, 0.02648252248764038]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 0.0, 7.0, 5.0, 6.0, 10.0, 13.0, 11.0, 16.0, 19.0, 18.0, 33.0, 18.0, 23.0, 30.0, 31.0, 45.0, 32.0, 46.0, 35.0, 40.0, 51.0, 49.0, 30.0, 42.0, 37.0, 29.0, 39.0, 33.0, 26.0, 23.0, 32.0, 23.0, 27.0, 20.0, 19.0, 19.0, 18.0, 17.0, 4.0, 6.0, 8.0, 4.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.712158203125, -11.31494140625, -10.917724609375, -10.5205078125, -10.123291015625, -9.72607421875, -9.328857421875, -8.931640625, -8.534423828125, -8.13720703125, -7.739990234375, -7.3427734375, -6.945556640625, -6.54833984375, -6.151123046875, -5.75390625, -5.356689453125, -4.95947265625, -4.562255859375, -4.1650390625, -3.767822265625, -3.37060546875, -2.973388671875, -2.576171875, -2.178955078125, -1.78173828125, -1.384521484375, -0.9873046875, -0.590087890625, -0.19287109375, 0.204345703125, 0.6015625, 0.998779296875, 1.39599609375, 1.793212890625, 2.1904296875, 2.587646484375, 2.98486328125, 3.382080078125, 3.779296875, 4.176513671875, 4.57373046875, 4.970947265625, 5.3681640625, 5.765380859375, 6.16259765625, 6.559814453125, 6.95703125, 7.354248046875, 7.75146484375, 8.148681640625, 8.5458984375, 8.943115234375, 9.34033203125, 9.737548828125, 10.134765625, 10.531982421875, 10.92919921875, 11.326416015625, 11.7236328125, 12.120849609375, 12.51806640625, 12.915283203125, 13.3125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 13.0, 8.0, 12.0, 19.0, 24.0, 37.0, 49.0, 52.0, 75.0, 88.0, 147.0, 234.0, 310.0, 483.0, 893.0, 1596.0, 3018.0, 6179.0, 12802.0, 28352.0, 65796.0, 168410.0, 424052.0, 198642.0, 75742.0, 32274.0, 14606.0, 6871.0, 3385.0, 1797.0, 944.0, 541.0, 311.0, 230.0, 143.0, 80.0, 78.0, 66.0, 56.0, 35.0, 22.0, 24.0, 21.0, 10.0, 4.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.3828125, -14.8797607421875, -14.376708984375, -13.8736572265625, -13.37060546875, -12.8675537109375, -12.364501953125, -11.8614501953125, -11.3583984375, -10.8553466796875, -10.352294921875, -9.8492431640625, -9.34619140625, -8.8431396484375, -8.340087890625, -7.8370361328125, -7.333984375, -6.8309326171875, -6.327880859375, -5.8248291015625, -5.32177734375, -4.8187255859375, -4.315673828125, -3.8126220703125, -3.3095703125, -2.8065185546875, -2.303466796875, -1.8004150390625, -1.29736328125, -0.7943115234375, -0.291259765625, 0.2117919921875, 0.71484375, 1.2178955078125, 1.720947265625, 2.2239990234375, 2.72705078125, 3.2301025390625, 3.733154296875, 4.2362060546875, 4.7392578125, 5.2423095703125, 5.745361328125, 6.2484130859375, 6.75146484375, 7.2545166015625, 7.757568359375, 8.2606201171875, 8.763671875, 9.2667236328125, 9.769775390625, 10.2728271484375, 10.77587890625, 11.2789306640625, 11.781982421875, 12.2850341796875, 12.7880859375, 13.2911376953125, 13.794189453125, 14.2972412109375, 14.80029296875, 15.3033447265625, 15.806396484375, 16.3094482421875, 16.8125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 3.0, 13.0, 11.0, 14.0, 18.0, 22.0, 20.0, 26.0, 24.0, 29.0, 42.0, 40.0, 59.0, 55.0, 78.0, 111.0, 221.0, 1494.0, 227.0, 98.0, 77.0, 55.0, 40.0, 49.0, 37.0, 27.0, 24.0, 22.0, 15.0, 17.0, 11.0, 14.0, 9.0, 11.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0], "bins": [-39.375, -38.262939453125, -37.15087890625, -36.038818359375, -34.9267578125, -33.814697265625, -32.70263671875, -31.590576171875, -30.478515625, -29.366455078125, -28.25439453125, -27.142333984375, -26.0302734375, -24.918212890625, -23.80615234375, -22.694091796875, -21.58203125, -20.469970703125, -19.35791015625, -18.245849609375, -17.1337890625, -16.021728515625, -14.90966796875, -13.797607421875, -12.685546875, -11.573486328125, -10.46142578125, -9.349365234375, -8.2373046875, -7.125244140625, -6.01318359375, -4.901123046875, -3.7890625, -2.677001953125, -1.56494140625, -0.452880859375, 0.6591796875, 1.771240234375, 2.88330078125, 3.995361328125, 5.107421875, 6.219482421875, 7.33154296875, 8.443603515625, 9.5556640625, 10.667724609375, 11.77978515625, 12.891845703125, 14.00390625, 15.115966796875, 16.22802734375, 17.340087890625, 18.4521484375, 19.564208984375, 20.67626953125, 21.788330078125, 22.900390625, 24.012451171875, 25.12451171875, 26.236572265625, 27.3486328125, 28.460693359375, 29.57275390625, 30.684814453125, 31.796875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 2.0, 8.0, 15.0, 9.0, 12.0, 27.0, 35.0, 31.0, 46.0, 65.0, 92.0, 120.0, 181.0, 361.0, 841.0, 4297.0, 60593.0, 2777603.0, 287346.0, 11384.0, 1395.0, 432.0, 233.0, 156.0, 117.0, 84.0, 56.0, 39.0, 34.0, 18.0, 19.0, 13.0, 7.0, 8.0, 9.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.59375, -48.76806640625, -46.9423828125, -45.11669921875, -43.291015625, -41.46533203125, -39.6396484375, -37.81396484375, -35.98828125, -34.16259765625, -32.3369140625, -30.51123046875, -28.685546875, -26.85986328125, -25.0341796875, -23.20849609375, -21.3828125, -19.55712890625, -17.7314453125, -15.90576171875, -14.080078125, -12.25439453125, -10.4287109375, -8.60302734375, -6.77734375, -4.95166015625, -3.1259765625, -1.30029296875, 0.525390625, 2.35107421875, 4.1767578125, 6.00244140625, 7.828125, 9.65380859375, 11.4794921875, 13.30517578125, 15.130859375, 16.95654296875, 18.7822265625, 20.60791015625, 22.43359375, 24.25927734375, 26.0849609375, 27.91064453125, 29.736328125, 31.56201171875, 33.3876953125, 35.21337890625, 37.0390625, 38.86474609375, 40.6904296875, 42.51611328125, 44.341796875, 46.16748046875, 47.9931640625, 49.81884765625, 51.64453125, 53.47021484375, 55.2958984375, 57.12158203125, 58.947265625, 60.77294921875, 62.5986328125, 64.42431640625, 66.25]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 12.0, 89.0, 332.0, 393.0, 151.0, 36.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.53226089477539, -40.807098388671875, -35.081932067871094, -29.356769561767578, -23.631607055664062, -17.906444549560547, -12.181278228759766, -6.45611572265625, -0.7309532165527344, 4.994210243225098, 10.71937370300293, 16.444538116455078, 22.169700622558594, 27.89486312866211, 33.62002944946289, 39.345191955566406, 45.07035446166992, 50.79551696777344, 56.52068328857422, 62.245845794677734, 67.97100830078125, 73.6961669921875, 79.42134094238281, 85.14649963378906, 90.87165832519531, 96.5968246459961, 102.32198333740234, 108.04714965820312, 113.77230834960938, 119.49747467041016, 125.22264099121094, 130.9477996826172, 136.6729736328125, 142.39813232421875, 148.12330627441406, 153.8484649658203, 159.57362365722656, 165.29879760742188, 171.02395629882812, 176.74911499023438, 182.47427368164062, 188.19943237304688, 193.9246063232422, 199.64976501464844, 205.3749237060547, 211.10009765625, 216.82525634765625, 222.5504150390625, 228.2755889892578, 234.00074768066406, 239.72592163085938, 245.45108032226562, 251.17623901367188, 256.9013977050781, 262.6265869140625, 268.35174560546875, 274.076904296875, 279.80206298828125, 285.5272216796875, 291.25238037109375, 296.9775695800781, 302.7027282714844, 308.4278869628906, 314.1530456542969, 319.8782043457031]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 12.0, 12.0, 16.0, 11.0, 18.0, 18.0, 18.0, 19.0, 19.0, 43.0, 31.0, 30.0, 30.0, 29.0, 51.0, 25.0, 36.0, 45.0, 30.0, 27.0, 46.0, 40.0, 35.0, 34.0, 28.0, 31.0, 19.0, 36.0, 25.0, 27.0, 14.0, 21.0, 14.0, 17.0, 13.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 7.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-61.914642333984375, -59.86324691772461, -57.81185531616211, -55.760459899902344, -53.709068298339844, -51.65767288208008, -49.60627746582031, -47.55488586425781, -45.50349044799805, -43.45209503173828, -41.40070343017578, -39.349308013916016, -37.29791259765625, -35.24652099609375, -33.195125579833984, -31.14373207092285, -29.09233856201172, -27.040945053100586, -24.989551544189453, -22.938156127929688, -20.886762619018555, -18.835369110107422, -16.783973693847656, -14.732580184936523, -12.68118667602539, -10.629793167114258, -8.578398704528809, -6.527004718780518, -4.475610733032227, -2.4242172241210938, -0.37282276153564453, 1.6785717010498047, 3.7299652099609375, 5.7813591957092285, 7.8327531814575195, 9.884147644042969, 11.935541152954102, 13.986934661865234, 16.038330078125, 18.089723587036133, 20.141117095947266, 22.1925106048584, 24.24390411376953, 26.295299530029297, 28.34669303894043, 30.398086547851562, 32.44948196411133, 34.500877380371094, 36.552268981933594, 38.60366439819336, 40.65505599975586, 42.706451416015625, 44.757843017578125, 46.80923843383789, 48.860633850097656, 50.912025451660156, 52.96342086791992, 55.01481628417969, 57.06620788574219, 59.11760330200195, 61.16899871826172, 63.22039031982422, 65.27178192138672, 67.32318115234375, 69.37457275390625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 9.0, 8.0, 11.0, 13.0, 18.0, 11.0, 18.0, 24.0, 29.0, 31.0, 29.0, 33.0, 31.0, 36.0, 38.0, 45.0, 33.0, 47.0, 51.0, 45.0, 51.0, 39.0, 37.0, 30.0, 34.0, 29.0, 26.0, 19.0, 24.0, 25.0, 22.0, 20.0, 14.0, 15.0, 12.0, 13.0, 4.0, 11.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.5, -14.080322265625, -13.66064453125, -13.240966796875, -12.8212890625, -12.401611328125, -11.98193359375, -11.562255859375, -11.142578125, -10.722900390625, -10.30322265625, -9.883544921875, -9.4638671875, -9.044189453125, -8.62451171875, -8.204833984375, -7.78515625, -7.365478515625, -6.94580078125, -6.526123046875, -6.1064453125, -5.686767578125, -5.26708984375, -4.847412109375, -4.427734375, -4.008056640625, -3.58837890625, -3.168701171875, -2.7490234375, -2.329345703125, -1.90966796875, -1.489990234375, -1.0703125, -0.650634765625, -0.23095703125, 0.188720703125, 0.6083984375, 1.028076171875, 1.44775390625, 1.867431640625, 2.287109375, 2.706787109375, 3.12646484375, 3.546142578125, 3.9658203125, 4.385498046875, 4.80517578125, 5.224853515625, 5.64453125, 6.064208984375, 6.48388671875, 6.903564453125, 7.3232421875, 7.742919921875, 8.16259765625, 8.582275390625, 9.001953125, 9.421630859375, 9.84130859375, 10.260986328125, 10.6806640625, 11.100341796875, 11.52001953125, 11.939697265625, 12.359375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 5.0, 2.0, 7.0, 6.0, 4.0, 12.0, 14.0, 9.0, 16.0, 15.0, 28.0, 36.0, 44.0, 81.0, 129.0, 265.0, 510.0, 1032.0, 2466.0, 6713.0, 23219.0, 116923.0, 789428.0, 2293808.0, 806129.0, 117801.0, 23948.0, 6833.0, 2486.0, 1093.0, 510.0, 283.0, 163.0, 96.0, 42.0, 24.0, 20.0, 20.0, 16.0, 12.0, 5.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.5, -18.839111328125, -18.17822265625, -17.517333984375, -16.8564453125, -16.195556640625, -15.53466796875, -14.873779296875, -14.212890625, -13.552001953125, -12.89111328125, -12.230224609375, -11.5693359375, -10.908447265625, -10.24755859375, -9.586669921875, -8.92578125, -8.264892578125, -7.60400390625, -6.943115234375, -6.2822265625, -5.621337890625, -4.96044921875, -4.299560546875, -3.638671875, -2.977783203125, -2.31689453125, -1.656005859375, -0.9951171875, -0.334228515625, 0.32666015625, 0.987548828125, 1.6484375, 2.309326171875, 2.97021484375, 3.631103515625, 4.2919921875, 4.952880859375, 5.61376953125, 6.274658203125, 6.935546875, 7.596435546875, 8.25732421875, 8.918212890625, 9.5791015625, 10.239990234375, 10.90087890625, 11.561767578125, 12.22265625, 12.883544921875, 13.54443359375, 14.205322265625, 14.8662109375, 15.527099609375, 16.18798828125, 16.848876953125, 17.509765625, 18.170654296875, 18.83154296875, 19.492431640625, 20.1533203125, 20.814208984375, 21.47509765625, 22.135986328125, 22.796875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 16.0, 21.0, 18.0, 21.0, 38.0, 58.0, 85.0, 87.0, 138.0, 187.0, 256.0, 395.0, 480.0, 550.0, 510.0, 377.0, 263.0, 184.0, 101.0, 85.0, 72.0, 24.0, 26.0, 18.0, 14.0, 8.0, 7.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.69482421875, -18.0615234375, -17.42822265625, -16.794921875, -16.16162109375, -15.5283203125, -14.89501953125, -14.26171875, -13.62841796875, -12.9951171875, -12.36181640625, -11.728515625, -11.09521484375, -10.4619140625, -9.82861328125, -9.1953125, -8.56201171875, -7.9287109375, -7.29541015625, -6.662109375, -6.02880859375, -5.3955078125, -4.76220703125, -4.12890625, -3.49560546875, -2.8623046875, -2.22900390625, -1.595703125, -0.96240234375, -0.3291015625, 0.30419921875, 0.9375, 1.57080078125, 2.2041015625, 2.83740234375, 3.470703125, 4.10400390625, 4.7373046875, 5.37060546875, 6.00390625, 6.63720703125, 7.2705078125, 7.90380859375, 8.537109375, 9.17041015625, 9.8037109375, 10.43701171875, 11.0703125, 11.70361328125, 12.3369140625, 12.97021484375, 13.603515625, 14.23681640625, 14.8701171875, 15.50341796875, 16.13671875, 16.77001953125, 17.4033203125, 18.03662109375, 18.669921875, 19.30322265625, 19.9365234375, 20.56982421875, 21.203125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 9.0, 12.0, 16.0, 26.0, 35.0, 46.0, 64.0, 135.0, 277.0, 580.0, 1375.0, 4433.0, 18024.0, 100341.0, 1014939.0, 2742815.0, 261883.0, 36952.0, 8061.0, 2394.0, 853.0, 437.0, 210.0, 115.0, 72.0, 54.0, 34.0, 27.0, 18.0, 14.0, 5.0, 7.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.90625, -34.857421875, -33.80859375, -32.759765625, -31.7109375, -30.662109375, -29.61328125, -28.564453125, -27.515625, -26.466796875, -25.41796875, -24.369140625, -23.3203125, -22.271484375, -21.22265625, -20.173828125, -19.125, -18.076171875, -17.02734375, -15.978515625, -14.9296875, -13.880859375, -12.83203125, -11.783203125, -10.734375, -9.685546875, -8.63671875, -7.587890625, -6.5390625, -5.490234375, -4.44140625, -3.392578125, -2.34375, -1.294921875, -0.24609375, 0.802734375, 1.8515625, 2.900390625, 3.94921875, 4.998046875, 6.046875, 7.095703125, 8.14453125, 9.193359375, 10.2421875, 11.291015625, 12.33984375, 13.388671875, 14.4375, 15.486328125, 16.53515625, 17.583984375, 18.6328125, 19.681640625, 20.73046875, 21.779296875, 22.828125, 23.876953125, 24.92578125, 25.974609375, 27.0234375, 28.072265625, 29.12109375, 30.169921875, 31.21875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 28.0, 230.0, 511.0, 219.0, 26.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.8870849609375, -129.66104125976562, -118.43499755859375, -107.20895385742188, -95.98291015625, -84.75686645507812, -73.53083038330078, -62.304786682128906, -51.07874298095703, -39.852699279785156, -28.626657485961914, -17.400615692138672, -6.174571990966797, 5.051471710205078, 16.277511596679688, 27.503555297851562, 38.72959899902344, 49.95564270019531, 61.18168640136719, 72.40773010253906, 83.63377380371094, 94.85981750488281, 106.08585357666016, 117.31189727783203, 128.53793334960938, 139.76397705078125, 150.99002075195312, 162.216064453125, 173.44210815429688, 184.66815185546875, 195.89419555664062, 207.1202392578125, 218.34628295898438, 229.57232666015625, 240.79837036132812, 252.0244140625, 263.2504577636719, 274.47650146484375, 285.7025451660156, 296.9285888671875, 308.1546325683594, 319.38067626953125, 330.6067199707031, 341.832763671875, 353.0588073730469, 364.28485107421875, 375.5108947753906, 386.7369384765625, 397.96295166015625, 409.1889953613281, 420.4150390625, 431.6410827636719, 442.86712646484375, 454.0931701660156, 465.3192138671875, 476.5452575683594, 487.77130126953125, 498.9973449707031, 510.223388671875, 521.4494018554688, 532.6754760742188, 543.9014892578125, 555.1275634765625, 566.3535766601562, 577.5796508789062]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 7.0, 4.0, 10.0, 9.0, 11.0, 9.0, 14.0, 15.0, 14.0, 15.0, 13.0, 24.0, 46.0, 37.0, 35.0, 56.0, 51.0, 34.0, 52.0, 34.0, 35.0, 47.0, 52.0, 30.0, 42.0, 35.0, 35.0, 30.0, 26.0, 33.0, 26.0, 23.0, 19.0, 19.0, 18.0, 10.0, 8.0, 7.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-72.07998657226562, -69.99510192871094, -67.91021728515625, -65.82533264160156, -63.740447998046875, -61.65556335449219, -59.5706787109375, -57.48579406738281, -55.400909423828125, -53.31602478027344, -51.23114013671875, -49.14625549316406, -47.061370849609375, -44.97648620605469, -42.8916015625, -40.80671691894531, -38.721832275390625, -36.63694763183594, -34.55206298828125, -32.46717834472656, -30.382293701171875, -28.297409057617188, -26.2125244140625, -24.127639770507812, -22.042755126953125, -19.957870483398438, -17.87298583984375, -15.788101196289062, -13.703216552734375, -11.618331909179688, -9.533447265625, -7.4485626220703125, -5.363677978515625, -3.2787933349609375, -1.19390869140625, 0.8909759521484375, 2.975860595703125, 5.0607452392578125, 7.1456298828125, 9.230514526367188, 11.315399169921875, 13.400283813476562, 15.48516845703125, 17.570053100585938, 19.654937744140625, 21.739822387695312, 23.82470703125, 25.909591674804688, 27.994476318359375, 30.079360961914062, 32.16424560546875, 34.24913024902344, 36.334014892578125, 38.41889953613281, 40.5037841796875, 42.58866882324219, 44.673553466796875, 46.75843811035156, 48.84332275390625, 50.92820739746094, 53.013092041015625, 55.09797668457031, 57.182861328125, 59.26774597167969, 61.352630615234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 5.0, 13.0, 11.0, 15.0, 9.0, 16.0, 18.0, 33.0, 26.0, 27.0, 30.0, 37.0, 32.0, 31.0, 25.0, 28.0, 43.0, 36.0, 55.0, 49.0, 43.0, 36.0, 46.0, 38.0, 29.0, 25.0, 22.0, 33.0, 26.0, 24.0, 20.0, 12.0, 21.0, 20.0, 13.0, 12.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.203125, -12.808349609375, -12.41357421875, -12.018798828125, -11.6240234375, -11.229248046875, -10.83447265625, -10.439697265625, -10.044921875, -9.650146484375, -9.25537109375, -8.860595703125, -8.4658203125, -8.071044921875, -7.67626953125, -7.281494140625, -6.88671875, -6.491943359375, -6.09716796875, -5.702392578125, -5.3076171875, -4.912841796875, -4.51806640625, -4.123291015625, -3.728515625, -3.333740234375, -2.93896484375, -2.544189453125, -2.1494140625, -1.754638671875, -1.35986328125, -0.965087890625, -0.5703125, -0.175537109375, 0.21923828125, 0.614013671875, 1.0087890625, 1.403564453125, 1.79833984375, 2.193115234375, 2.587890625, 2.982666015625, 3.37744140625, 3.772216796875, 4.1669921875, 4.561767578125, 4.95654296875, 5.351318359375, 5.74609375, 6.140869140625, 6.53564453125, 6.930419921875, 7.3251953125, 7.719970703125, 8.11474609375, 8.509521484375, 8.904296875, 9.299072265625, 9.69384765625, 10.088623046875, 10.4833984375, 10.878173828125, 11.27294921875, 11.667724609375, 12.0625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 12.0, 15.0, 32.0, 34.0, 55.0, 98.0, 117.0, 155.0, 267.0, 346.0, 491.0, 743.0, 1058.0, 1466.0, 2104.0, 3006.0, 4270.0, 6084.0, 8860.0, 13130.0, 19236.0, 27935.0, 42005.0, 62051.0, 88984.0, 120644.0, 145206.0, 139930.0, 110810.0, 79156.0, 54505.0, 36816.0, 24662.0, 16739.0, 11432.0, 7897.0, 5428.0, 3881.0, 2641.0, 1838.0, 1351.0, 924.0, 680.0, 430.0, 307.0, 221.0, 157.0, 117.0, 73.0, 57.0, 41.0, 22.0, 12.0, 6.0, 11.0, 5.0, 1.0, 3.0], "bins": [-0.79638671875, -0.7721328735351562, -0.7478790283203125, -0.7236251831054688, -0.699371337890625, -0.6751174926757812, -0.6508636474609375, -0.6266098022460938, -0.60235595703125, -0.5781021118164062, -0.5538482666015625, -0.5295944213867188, -0.505340576171875, -0.48108673095703125, -0.4568328857421875, -0.43257904052734375, -0.4083251953125, -0.38407135009765625, -0.3598175048828125, -0.33556365966796875, -0.311309814453125, -0.28705596923828125, -0.2628021240234375, -0.23854827880859375, -0.21429443359375, -0.19004058837890625, -0.1657867431640625, -0.14153289794921875, -0.117279052734375, -0.09302520751953125, -0.0687713623046875, -0.04451751708984375, -0.020263671875, 0.00399017333984375, 0.0282440185546875, 0.05249786376953125, 0.076751708984375, 0.10100555419921875, 0.1252593994140625, 0.14951324462890625, 0.17376708984375, 0.19802093505859375, 0.2222747802734375, 0.24652862548828125, 0.270782470703125, 0.29503631591796875, 0.3192901611328125, 0.34354400634765625, 0.3677978515625, 0.39205169677734375, 0.4163055419921875, 0.44055938720703125, 0.464813232421875, 0.48906707763671875, 0.5133209228515625, 0.5375747680664062, 0.56182861328125, 0.5860824584960938, 0.6103363037109375, 0.6345901489257812, 0.658843994140625, 0.6830978393554688, 0.7073516845703125, 0.7316055297851562, 0.755859375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 5.0, 3.0, 6.0, 8.0, 10.0, 17.0, 14.0, 17.0, 20.0, 25.0, 22.0, 32.0, 28.0, 38.0, 35.0, 40.0, 43.0, 36.0, 41.0, 1074.0, 41.0, 52.0, 54.0, 34.0, 33.0, 45.0, 35.0, 33.0, 34.0, 31.0, 20.0, 15.0, 15.0, 14.0, 14.0, 13.0, 11.0, 5.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.6953125, -9.4061279296875, -9.116943359375, -8.8277587890625, -8.53857421875, -8.2493896484375, -7.960205078125, -7.6710205078125, -7.3818359375, -7.0926513671875, -6.803466796875, -6.5142822265625, -6.22509765625, -5.9359130859375, -5.646728515625, -5.3575439453125, -5.068359375, -4.7791748046875, -4.489990234375, -4.2008056640625, -3.91162109375, -3.6224365234375, -3.333251953125, -3.0440673828125, -2.7548828125, -2.4656982421875, -2.176513671875, -1.8873291015625, -1.59814453125, -1.3089599609375, -1.019775390625, -0.7305908203125, -0.44140625, -0.1522216796875, 0.136962890625, 0.4261474609375, 0.71533203125, 1.0045166015625, 1.293701171875, 1.5828857421875, 1.8720703125, 2.1612548828125, 2.450439453125, 2.7396240234375, 3.02880859375, 3.3179931640625, 3.607177734375, 3.8963623046875, 4.185546875, 4.4747314453125, 4.763916015625, 5.0531005859375, 5.34228515625, 5.6314697265625, 5.920654296875, 6.2098388671875, 6.4990234375, 6.7882080078125, 7.077392578125, 7.3665771484375, 7.65576171875, 7.9449462890625, 8.234130859375, 8.5233154296875, 8.8125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 13.0, 14.0, 12.0, 30.0, 45.0, 63.0, 95.0, 144.0, 223.0, 368.0, 550.0, 841.0, 1300.0, 2147.0, 3255.0, 5290.0, 8192.0, 13191.0, 20983.0, 33607.0, 53595.0, 81597.0, 116238.0, 185443.0, 1164962.0, 133073.0, 96207.0, 64617.0, 41367.0, 25982.0, 16175.0, 10012.0, 6289.0, 4052.0, 2531.0, 1586.0, 1029.0, 686.0, 451.0, 291.0, 190.0, 141.0, 77.0, 60.0, 40.0, 21.0, 15.0, 15.0, 6.0, 9.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.69580078125, -0.6748580932617188, -0.6539154052734375, -0.6329727172851562, -0.612030029296875, -0.5910873413085938, -0.5701446533203125, -0.5492019653320312, -0.52825927734375, -0.5073165893554688, -0.4863739013671875, -0.46543121337890625, -0.444488525390625, -0.42354583740234375, -0.4026031494140625, -0.38166046142578125, -0.3607177734375, -0.33977508544921875, -0.3188323974609375, -0.29788970947265625, -0.276947021484375, -0.25600433349609375, -0.2350616455078125, -0.21411895751953125, -0.19317626953125, -0.17223358154296875, -0.1512908935546875, -0.13034820556640625, -0.109405517578125, -0.08846282958984375, -0.0675201416015625, -0.04657745361328125, -0.025634765625, -0.00469207763671875, 0.0162506103515625, 0.03719329833984375, 0.058135986328125, 0.07907867431640625, 0.1000213623046875, 0.12096405029296875, 0.14190673828125, 0.16284942626953125, 0.1837921142578125, 0.20473480224609375, 0.225677490234375, 0.24662017822265625, 0.2675628662109375, 0.28850555419921875, 0.3094482421875, 0.33039093017578125, 0.3513336181640625, 0.37227630615234375, 0.393218994140625, 0.41416168212890625, 0.4351043701171875, 0.45604705810546875, 0.47698974609375, 0.49793243408203125, 0.5188751220703125, 0.5398178100585938, 0.560760498046875, 0.5817031860351562, 0.6026458740234375, 0.6235885620117188, 0.64453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 13.0, 7.0, 8.0, 14.0, 20.0, 15.0, 35.0, 40.0, 60.0, 66.0, 76.0, 107.0, 113.0, 89.0, 84.0, 62.0, 52.0, 35.0, 26.0, 17.0, 16.0, 13.0, 9.0, 5.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015411376953125, -0.014655113220214844, -0.013898849487304688, -0.013142585754394531, -0.012386322021484375, -0.011630058288574219, -0.010873794555664062, -0.010117530822753906, -0.00936126708984375, -0.008605003356933594, -0.007848739624023438, -0.007092475891113281, -0.006336212158203125, -0.005579948425292969, -0.0048236846923828125, -0.004067420959472656, -0.0033111572265625, -0.0025548934936523438, -0.0017986297607421875, -0.0010423660278320312, -0.000286102294921875, 0.00047016143798828125, 0.0012264251708984375, 0.0019826889038085938, 0.00273895263671875, 0.0034952163696289062, 0.0042514801025390625, 0.005007743835449219, 0.005764007568359375, 0.006520271301269531, 0.0072765350341796875, 0.008032798767089844, 0.0087890625, 0.009545326232910156, 0.010301589965820312, 0.011057853698730469, 0.011814117431640625, 0.012570381164550781, 0.013326644897460938, 0.014082908630371094, 0.01483917236328125, 0.015595436096191406, 0.016351699829101562, 0.01710796356201172, 0.017864227294921875, 0.01862049102783203, 0.019376754760742188, 0.020133018493652344, 0.0208892822265625, 0.021645545959472656, 0.022401809692382812, 0.02315807342529297, 0.023914337158203125, 0.02467060089111328, 0.025426864624023438, 0.026183128356933594, 0.02693939208984375, 0.027695655822753906, 0.028451919555664062, 0.02920818328857422, 0.029964447021484375, 0.03072071075439453, 0.03147697448730469, 0.032233238220214844, 0.032989501953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 12.0, 12.0, 14.0, 23.0, 26.0, 46.0, 59.0, 77.0, 159.0, 288.0, 589.0, 10730.0, 1027500.0, 7667.0, 556.0, 294.0, 162.0, 104.0, 55.0, 41.0, 32.0, 26.0, 20.0, 18.0, 11.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.66015625, -0.6449699401855469, -0.6297836303710938, -0.6145973205566406, -0.5994110107421875, -0.5842247009277344, -0.5690383911132812, -0.5538520812988281, -0.538665771484375, -0.5234794616699219, -0.5082931518554688, -0.4931068420410156, -0.4779205322265625, -0.4627342224121094, -0.44754791259765625, -0.4323616027832031, -0.41717529296875, -0.4019889831542969, -0.38680267333984375, -0.3716163635253906, -0.3564300537109375, -0.3412437438964844, -0.32605743408203125, -0.3108711242675781, -0.295684814453125, -0.2804985046386719, -0.26531219482421875, -0.2501258850097656, -0.2349395751953125, -0.21975326538085938, -0.20456695556640625, -0.18938064575195312, -0.1741943359375, -0.15900802612304688, -0.14382171630859375, -0.12863540649414062, -0.1134490966796875, -0.09826278686523438, -0.08307647705078125, -0.06789016723632812, -0.052703857421875, -0.037517547607421875, -0.02233123779296875, -0.007144927978515625, 0.0080413818359375, 0.023227691650390625, 0.03841400146484375, 0.053600311279296875, 0.06878662109375, 0.08397293090820312, 0.09915924072265625, 0.11434555053710938, 0.1295318603515625, 0.14471817016601562, 0.15990447998046875, 0.17509078979492188, 0.190277099609375, 0.20546340942382812, 0.22064971923828125, 0.23583602905273438, 0.2510223388671875, 0.2662086486816406, 0.28139495849609375, 0.2965812683105469, 0.311767578125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [20.0, 777.0, 217.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008801125921308994, -0.003829937893897295, 0.0011412501335144043, 0.006112438626587391, 0.011083626188337803, 0.01605481281876564, 0.02102600410580635, 0.025997191667556763, 0.030968379229307175, 0.03593956679105759, 0.040910754352808, 0.04588194191455841, 0.05085313320159912, 0.055824317038059235, 0.060795508325099945, 0.06576669216156006, 0.07073788344860077, 0.07570907473564148, 0.08068025857210159, 0.0856514498591423, 0.09062263369560242, 0.09559382498264313, 0.10056501626968384, 0.10553620010614395, 0.11050738394260406, 0.11547857522964478, 0.12044975906610489, 0.125420942902565, 0.1303921341896057, 0.13536332547664642, 0.14033451676368713, 0.14530569314956665, 0.15027688443660736, 0.15524807572364807, 0.16021926701068878, 0.1651904433965683, 0.170161634683609, 0.17513282597064972, 0.18010401725769043, 0.18507519364356995, 0.19004638493061066, 0.19501757621765137, 0.19998876750469208, 0.2049599438905716, 0.2099311351776123, 0.21490232646465302, 0.21987351775169373, 0.22484469413757324, 0.22981590032577515, 0.23478709161281586, 0.23975828289985657, 0.24472945928573608, 0.2497006505727768, 0.2546718418598175, 0.259643018245697, 0.2646142244338989, 0.26958540081977844, 0.27455657720565796, 0.27952778339385986, 0.2844989597797394, 0.2894701659679413, 0.2944413423538208, 0.2994125187397003, 0.3043837249279022, 0.30935490131378174]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 10.0, 2.0, 7.0, 8.0, 13.0, 13.0, 15.0, 23.0, 34.0, 40.0, 46.0, 46.0, 47.0, 58.0, 58.0, 71.0, 47.0, 53.0, 54.0, 56.0, 60.0, 63.0, 35.0, 27.0, 32.0, 19.0, 12.0, 17.0, 10.0, 6.0, 10.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015604794025421143, -0.015161249786615372, -0.0147177055478096, -0.01427416130900383, -0.013830617070198059, -0.013387072831392288, -0.012943528592586517, -0.012499984353780746, -0.012056440114974976, -0.011612895876169205, -0.011169351637363434, -0.010725807398557663, -0.010282263159751892, -0.009838718920946121, -0.00939517468214035, -0.00895163044333458, -0.008508086204528809, -0.008064541965723038, -0.007620997726917267, -0.007177453488111496, -0.006733909249305725, -0.006290365010499954, -0.005846820771694183, -0.0054032765328884125, -0.004959732294082642, -0.004516188055276871, -0.0040726438164711, -0.003629099577665329, -0.003185555338859558, -0.0027420111000537872, -0.0022984668612480164, -0.0018549226224422455, -0.0014113783836364746, -0.0009678341448307037, -0.0005242899060249329, -8.074566721916199e-05, 0.0003627985715866089, 0.0008063428103923798, 0.0012498870491981506, 0.0016934312880039215, 0.0021369755268096924, 0.0025805197656154633, 0.003024064004421234, 0.003467608243227005, 0.003911152482032776, 0.004354696720838547, 0.004798240959644318, 0.0052417851984500885, 0.005685329437255859, 0.00612887367606163, 0.006572417914867401, 0.007015962153673172, 0.007459506392478943, 0.007903050631284714, 0.008346594870090485, 0.008790139108896255, 0.009233683347702026, 0.009677227586507797, 0.010120771825313568, 0.010564316064119339, 0.01100786030292511, 0.01145140454173088, 0.011894948780536652, 0.012338493019342422, 0.012782037258148193]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 6.0, 5.0, 13.0, 10.0, 16.0, 9.0, 16.0, 18.0, 33.0, 26.0, 27.0, 30.0, 37.0, 32.0, 31.0, 25.0, 28.0, 43.0, 36.0, 55.0, 49.0, 43.0, 36.0, 46.0, 38.0, 29.0, 25.0, 22.0, 33.0, 26.0, 24.0, 20.0, 12.0, 21.0, 20.0, 13.0, 12.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.203125, -12.808349609375, -12.41357421875, -12.018798828125, -11.6240234375, -11.229248046875, -10.83447265625, -10.439697265625, -10.044921875, -9.650146484375, -9.25537109375, -8.860595703125, -8.4658203125, -8.071044921875, -7.67626953125, -7.281494140625, -6.88671875, -6.491943359375, -6.09716796875, -5.702392578125, -5.3076171875, -4.912841796875, -4.51806640625, -4.123291015625, -3.728515625, -3.333740234375, -2.93896484375, -2.544189453125, -2.1494140625, -1.754638671875, -1.35986328125, -0.965087890625, -0.5703125, -0.175537109375, 0.21923828125, 0.614013671875, 1.0087890625, 1.403564453125, 1.79833984375, 2.193115234375, 2.587890625, 2.982666015625, 3.37744140625, 3.772216796875, 4.1669921875, 4.561767578125, 4.95654296875, 5.351318359375, 5.74609375, 6.140869140625, 6.53564453125, 6.930419921875, 7.3251953125, 7.719970703125, 8.11474609375, 8.509521484375, 8.904296875, 9.299072265625, 9.69384765625, 10.088623046875, 10.4833984375, 10.878173828125, 11.27294921875, 11.667724609375, 12.0625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 8.0, 7.0, 9.0, 6.0, 18.0, 21.0, 26.0, 46.0, 52.0, 77.0, 102.0, 146.0, 218.0, 360.0, 566.0, 1014.0, 1697.0, 3283.0, 6873.0, 14899.0, 34366.0, 86260.0, 249363.0, 391718.0, 154689.0, 57392.0, 23730.0, 10560.0, 4979.0, 2463.0, 1381.0, 809.0, 446.0, 328.0, 189.0, 123.0, 82.0, 71.0, 40.0, 38.0, 22.0, 19.0, 16.0, 14.0, 5.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-17.40625, -16.88330078125, -16.3603515625, -15.83740234375, -15.314453125, -14.79150390625, -14.2685546875, -13.74560546875, -13.22265625, -12.69970703125, -12.1767578125, -11.65380859375, -11.130859375, -10.60791015625, -10.0849609375, -9.56201171875, -9.0390625, -8.51611328125, -7.9931640625, -7.47021484375, -6.947265625, -6.42431640625, -5.9013671875, -5.37841796875, -4.85546875, -4.33251953125, -3.8095703125, -3.28662109375, -2.763671875, -2.24072265625, -1.7177734375, -1.19482421875, -0.671875, -0.14892578125, 0.3740234375, 0.89697265625, 1.419921875, 1.94287109375, 2.4658203125, 2.98876953125, 3.51171875, 4.03466796875, 4.5576171875, 5.08056640625, 5.603515625, 6.12646484375, 6.6494140625, 7.17236328125, 7.6953125, 8.21826171875, 8.7412109375, 9.26416015625, 9.787109375, 10.31005859375, 10.8330078125, 11.35595703125, 11.87890625, 12.40185546875, 12.9248046875, 13.44775390625, 13.970703125, 14.49365234375, 15.0166015625, 15.53955078125, 16.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 7.0, 2.0, 8.0, 5.0, 5.0, 8.0, 9.0, 13.0, 11.0, 9.0, 17.0, 17.0, 25.0, 21.0, 37.0, 46.0, 37.0, 49.0, 63.0, 74.0, 140.0, 230.0, 1436.0, 213.0, 125.0, 86.0, 54.0, 45.0, 44.0, 25.0, 32.0, 25.0, 26.0, 22.0, 9.0, 15.0, 12.0, 11.0, 14.0, 4.0, 6.0, 6.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-33.125, -32.10595703125, -31.0869140625, -30.06787109375, -29.048828125, -28.02978515625, -27.0107421875, -25.99169921875, -24.97265625, -23.95361328125, -22.9345703125, -21.91552734375, -20.896484375, -19.87744140625, -18.8583984375, -17.83935546875, -16.8203125, -15.80126953125, -14.7822265625, -13.76318359375, -12.744140625, -11.72509765625, -10.7060546875, -9.68701171875, -8.66796875, -7.64892578125, -6.6298828125, -5.61083984375, -4.591796875, -3.57275390625, -2.5537109375, -1.53466796875, -0.515625, 0.50341796875, 1.5224609375, 2.54150390625, 3.560546875, 4.57958984375, 5.5986328125, 6.61767578125, 7.63671875, 8.65576171875, 9.6748046875, 10.69384765625, 11.712890625, 12.73193359375, 13.7509765625, 14.77001953125, 15.7890625, 16.80810546875, 17.8271484375, 18.84619140625, 19.865234375, 20.88427734375, 21.9033203125, 22.92236328125, 23.94140625, 24.96044921875, 25.9794921875, 26.99853515625, 28.017578125, 29.03662109375, 30.0556640625, 31.07470703125, 32.09375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 10.0, 14.0, 13.0, 13.0, 18.0, 28.0, 44.0, 56.0, 91.0, 120.0, 183.0, 329.0, 721.0, 3848.0, 113189.0, 2952475.0, 69946.0, 2928.0, 638.0, 371.0, 197.0, 121.0, 82.0, 55.0, 58.0, 30.0, 28.0, 21.0, 18.0, 10.0, 14.0, 8.0, 4.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0], "bins": [-81.875, -79.7451171875, -77.615234375, -75.4853515625, -73.35546875, -71.2255859375, -69.095703125, -66.9658203125, -64.8359375, -62.7060546875, -60.576171875, -58.4462890625, -56.31640625, -54.1865234375, -52.056640625, -49.9267578125, -47.796875, -45.6669921875, -43.537109375, -41.4072265625, -39.27734375, -37.1474609375, -35.017578125, -32.8876953125, -30.7578125, -28.6279296875, -26.498046875, -24.3681640625, -22.23828125, -20.1083984375, -17.978515625, -15.8486328125, -13.71875, -11.5888671875, -9.458984375, -7.3291015625, -5.19921875, -3.0693359375, -0.939453125, 1.1904296875, 3.3203125, 5.4501953125, 7.580078125, 9.7099609375, 11.83984375, 13.9697265625, 16.099609375, 18.2294921875, 20.359375, 22.4892578125, 24.619140625, 26.7490234375, 28.87890625, 31.0087890625, 33.138671875, 35.2685546875, 37.3984375, 39.5283203125, 41.658203125, 43.7880859375, 45.91796875, 48.0478515625, 50.177734375, 52.3076171875, 54.4375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 14.0, 320.0, 590.0, 87.0, 4.0, 0.0, 1.0, 1.0], "bins": [-557.5526123046875, -547.9741821289062, -538.3956909179688, -528.8172607421875, -519.23876953125, -509.66033935546875, -500.0818786621094, -490.50341796875, -480.9249572753906, -471.34649658203125, -461.7680358886719, -452.1895751953125, -442.61114501953125, -433.0326843261719, -423.4542236328125, -413.8757629394531, -404.29730224609375, -394.7188415527344, -385.140380859375, -375.5619201660156, -365.98345947265625, -356.405029296875, -346.8265686035156, -337.24810791015625, -327.6696472167969, -318.0911865234375, -308.5127258300781, -298.93426513671875, -289.3558349609375, -279.7773742675781, -270.19891357421875, -260.6204528808594, -251.0419921875, -241.46353149414062, -231.88507080078125, -222.30662536621094, -212.72816467285156, -203.1497039794922, -193.57125854492188, -183.9927978515625, -174.41433715820312, -164.83587646484375, -155.25741577148438, -145.67897033691406, -136.1005096435547, -126.52204895019531, -116.94359588623047, -107.36514282226562, -97.78668212890625, -88.20822143554688, -78.62976837158203, -69.05131530761719, -59.47285461425781, -49.8943977355957, -40.315940856933594, -30.73748779296875, -21.15903091430664, -11.580574035644531, -2.002117156982422, 7.5763397216796875, 17.154796600341797, 26.733253479003906, 36.311710357666016, 45.89016342163086, 55.468624114990234]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 6.0, 10.0, 12.0, 9.0, 14.0, 14.0, 12.0, 19.0, 26.0, 37.0, 32.0, 38.0, 39.0, 41.0, 35.0, 41.0, 56.0, 51.0, 44.0, 41.0, 43.0, 41.0, 31.0, 31.0, 41.0, 30.0, 25.0, 32.0, 22.0, 15.0, 18.0, 19.0, 5.0, 10.0, 14.0, 9.0, 10.0, 4.0, 5.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.30076599121094, -79.00665283203125, -76.71253967285156, -74.4184341430664, -72.12432098388672, -69.83020782470703, -67.53610229492188, -65.24198913574219, -62.9478759765625, -60.65376281738281, -58.35965347290039, -56.06554412841797, -53.77143096923828, -51.477317810058594, -49.18320846557617, -46.88909912109375, -44.59498596191406, -42.300872802734375, -40.00676345825195, -37.71265411376953, -35.418540954589844, -33.124427795410156, -30.830318450927734, -28.53620719909668, -26.242095947265625, -23.94798469543457, -21.653873443603516, -19.35976219177246, -17.065650939941406, -14.771539688110352, -12.477428436279297, -10.183317184448242, -7.8892059326171875, -5.595094680786133, -3.300983428955078, -1.0068721771240234, 1.2872390747070312, 3.581350326538086, 5.875461578369141, 8.169572830200195, 10.46368408203125, 12.757795333862305, 15.05190658569336, 17.346017837524414, 19.64012908935547, 21.934240341186523, 24.228351593017578, 26.522462844848633, 28.816574096679688, 31.110685348510742, 33.4047966003418, 35.69890594482422, 37.993019104003906, 40.287132263183594, 42.581241607666016, 44.87535095214844, 47.169464111328125, 49.46357727050781, 51.757686614990234, 54.051795959472656, 56.345909118652344, 58.64002227783203, 60.93413162231445, 63.228240966796875, 65.52235412597656]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 2.0, 7.0, 7.0, 5.0, 9.0, 14.0, 13.0, 23.0, 20.0, 23.0, 18.0, 20.0, 24.0, 25.0, 30.0, 33.0, 43.0, 32.0, 40.0, 39.0, 54.0, 35.0, 34.0, 52.0, 46.0, 45.0, 35.0, 33.0, 33.0, 31.0, 28.0, 18.0, 22.0, 20.0, 9.0, 17.0, 14.0, 12.0, 11.0, 7.0, 10.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.4765625, -14.0648193359375, -13.653076171875, -13.2413330078125, -12.82958984375, -12.4178466796875, -12.006103515625, -11.5943603515625, -11.1826171875, -10.7708740234375, -10.359130859375, -9.9473876953125, -9.53564453125, -9.1239013671875, -8.712158203125, -8.3004150390625, -7.888671875, -7.4769287109375, -7.065185546875, -6.6534423828125, -6.24169921875, -5.8299560546875, -5.418212890625, -5.0064697265625, -4.5947265625, -4.1829833984375, -3.771240234375, -3.3594970703125, -2.94775390625, -2.5360107421875, -2.124267578125, -1.7125244140625, -1.30078125, -0.8890380859375, -0.477294921875, -0.0655517578125, 0.34619140625, 0.7579345703125, 1.169677734375, 1.5814208984375, 1.9931640625, 2.4049072265625, 2.816650390625, 3.2283935546875, 3.64013671875, 4.0518798828125, 4.463623046875, 4.8753662109375, 5.287109375, 5.6988525390625, 6.110595703125, 6.5223388671875, 6.93408203125, 7.3458251953125, 7.757568359375, 8.1693115234375, 8.5810546875, 8.9927978515625, 9.404541015625, 9.8162841796875, 10.22802734375, 10.6397705078125, 11.051513671875, 11.4632568359375, 11.875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 5.0, 8.0, 6.0, 14.0, 13.0, 16.0, 15.0, 25.0, 33.0, 26.0, 48.0, 51.0, 70.0, 100.0, 130.0, 197.0, 224.0, 288.0, 486.0, 4284.0, 4175731.0, 10550.0, 587.0, 351.0, 222.0, 208.0, 143.0, 86.0, 75.0, 70.0, 43.0, 33.0, 20.0, 21.0, 17.0, 21.0, 16.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-170.375, -164.802734375, -159.23046875, -153.658203125, -148.0859375, -142.513671875, -136.94140625, -131.369140625, -125.796875, -120.224609375, -114.65234375, -109.080078125, -103.5078125, -97.935546875, -92.36328125, -86.791015625, -81.21875, -75.646484375, -70.07421875, -64.501953125, -58.9296875, -53.357421875, -47.78515625, -42.212890625, -36.640625, -31.068359375, -25.49609375, -19.923828125, -14.3515625, -8.779296875, -3.20703125, 2.365234375, 7.9375, 13.509765625, 19.08203125, 24.654296875, 30.2265625, 35.798828125, 41.37109375, 46.943359375, 52.515625, 58.087890625, 63.66015625, 69.232421875, 74.8046875, 80.376953125, 85.94921875, 91.521484375, 97.09375, 102.666015625, 108.23828125, 113.810546875, 119.3828125, 124.955078125, 130.52734375, 136.099609375, 141.671875, 147.244140625, 152.81640625, 158.388671875, 163.9609375, 169.533203125, 175.10546875, 180.677734375, 186.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 13.0, 13.0, 22.0, 22.0, 46.0, 47.0, 71.0, 113.0, 163.0, 241.0, 359.0, 512.0, 629.0, 595.0, 367.0, 243.0, 169.0, 106.0, 85.0, 61.0, 39.0, 40.0, 22.0, 19.0, 7.0, 8.0, 8.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.09375, -15.4404296875, -14.787109375, -14.1337890625, -13.48046875, -12.8271484375, -12.173828125, -11.5205078125, -10.8671875, -10.2138671875, -9.560546875, -8.9072265625, -8.25390625, -7.6005859375, -6.947265625, -6.2939453125, -5.640625, -4.9873046875, -4.333984375, -3.6806640625, -3.02734375, -2.3740234375, -1.720703125, -1.0673828125, -0.4140625, 0.2392578125, 0.892578125, 1.5458984375, 2.19921875, 2.8525390625, 3.505859375, 4.1591796875, 4.8125, 5.4658203125, 6.119140625, 6.7724609375, 7.42578125, 8.0791015625, 8.732421875, 9.3857421875, 10.0390625, 10.6923828125, 11.345703125, 11.9990234375, 12.65234375, 13.3056640625, 13.958984375, 14.6123046875, 15.265625, 15.9189453125, 16.572265625, 17.2255859375, 17.87890625, 18.5322265625, 19.185546875, 19.8388671875, 20.4921875, 21.1455078125, 21.798828125, 22.4521484375, 23.10546875, 23.7587890625, 24.412109375, 25.0654296875, 25.71875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 10.0, 10.0, 14.0, 19.0, 28.0, 28.0, 37.0, 41.0, 41.0, 80.0, 91.0, 282.0, 1878.0, 211897.0, 3964073.0, 14541.0, 670.0, 186.0, 91.0, 56.0, 38.0, 36.0, 26.0, 24.0, 19.0, 19.0, 20.0, 12.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.0, -103.4638671875, -99.927734375, -96.3916015625, -92.85546875, -89.3193359375, -85.783203125, -82.2470703125, -78.7109375, -75.1748046875, -71.638671875, -68.1025390625, -64.56640625, -61.0302734375, -57.494140625, -53.9580078125, -50.421875, -46.8857421875, -43.349609375, -39.8134765625, -36.27734375, -32.7412109375, -29.205078125, -25.6689453125, -22.1328125, -18.5966796875, -15.060546875, -11.5244140625, -7.98828125, -4.4521484375, -0.916015625, 2.6201171875, 6.15625, 9.6923828125, 13.228515625, 16.7646484375, 20.30078125, 23.8369140625, 27.373046875, 30.9091796875, 34.4453125, 37.9814453125, 41.517578125, 45.0537109375, 48.58984375, 52.1259765625, 55.662109375, 59.1982421875, 62.734375, 66.2705078125, 69.806640625, 73.3427734375, 76.87890625, 80.4150390625, 83.951171875, 87.4873046875, 91.0234375, 94.5595703125, 98.095703125, 101.6318359375, 105.16796875, 108.7041015625, 112.240234375, 115.7763671875, 119.3125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 13.0, 113.0, 393.0, 371.0, 107.0, 15.0, 1.0, 1.0, 0.0, 1.0], "bins": [-506.3465270996094, -497.4556884765625, -488.5648498535156, -479.67401123046875, -470.7831726074219, -461.892333984375, -453.0014953613281, -444.11065673828125, -435.2198181152344, -426.3289794921875, -417.4381408691406, -408.54730224609375, -399.6564636230469, -390.765625, -381.8747863769531, -372.98394775390625, -364.09307861328125, -355.2022399902344, -346.3114013671875, -337.4205627441406, -328.52972412109375, -319.6388854980469, -310.748046875, -301.8572082519531, -292.96636962890625, -284.0755310058594, -275.1846923828125, -266.2938537597656, -257.40301513671875, -248.51217651367188, -239.621337890625, -230.73049926757812, -221.8396453857422, -212.9488067626953, -204.05796813964844, -195.16712951660156, -186.2762908935547, -177.3854522705078, -168.49459838867188, -159.603759765625, -150.71292114257812, -141.82208251953125, -132.93124389648438, -124.0404052734375, -115.14956665039062, -106.25872802734375, -97.36788177490234, -88.47704315185547, -79.58621215820312, -70.69537353515625, -61.804534912109375, -52.913692474365234, -44.02285385131836, -35.132015228271484, -26.241172790527344, -17.35033416748047, -8.459495544433594, 0.43134403228759766, 9.322183609008789, 18.213024139404297, 27.103862762451172, 35.99470138549805, 44.88554382324219, 53.77638244628906, 62.66722106933594]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 3.0, 13.0, 12.0, 10.0, 19.0, 17.0, 13.0, 36.0, 25.0, 28.0, 29.0, 41.0, 34.0, 34.0, 36.0, 36.0, 44.0, 27.0, 50.0, 39.0, 46.0, 56.0, 39.0, 38.0, 34.0, 34.0, 33.0, 24.0, 27.0, 22.0, 13.0, 15.0, 11.0, 13.0, 16.0, 5.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.6031265258789, -66.5176010131836, -64.43206787109375, -62.34654235839844, -60.261016845703125, -58.17549133300781, -56.089962005615234, -54.004432678222656, -51.918907165527344, -49.83338165283203, -47.74785232543945, -45.662322998046875, -43.57679748535156, -41.49127197265625, -39.40574264526367, -37.320213317871094, -35.23468780517578, -33.14916229248047, -31.06363296508789, -28.978105545043945, -26.892578125, -24.807050704956055, -22.72152328491211, -20.635995864868164, -18.55046844482422, -16.464941024780273, -14.379413604736328, -12.293886184692383, -10.208358764648438, -8.122831344604492, -6.037303924560547, -3.9517765045166016, -1.866241455078125, 0.2192859649658203, 2.3048133850097656, 4.390340805053711, 6.475868225097656, 8.561395645141602, 10.646923065185547, 12.732450485229492, 14.817977905273438, 16.903505325317383, 18.989032745361328, 21.074560165405273, 23.16008758544922, 25.245615005493164, 27.33114242553711, 29.416669845581055, 31.502197265625, 33.58772277832031, 35.67325210571289, 37.75878143310547, 39.84430694580078, 41.929832458496094, 44.01536178588867, 46.10089111328125, 48.18641662597656, 50.271942138671875, 52.35747146606445, 54.44300079345703, 56.528526306152344, 58.614051818847656, 60.699581146240234, 62.78511047363281, 64.87063598632812]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 10.0, 19.0, 16.0, 16.0, 27.0, 18.0, 35.0, 37.0, 31.0, 32.0, 36.0, 39.0, 48.0, 40.0, 39.0, 50.0, 48.0, 57.0, 41.0, 46.0, 29.0, 37.0, 25.0, 31.0, 24.0, 25.0, 23.0, 21.0, 11.0, 11.0, 16.0, 6.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.8851318359375, -13.465576171875, -13.0460205078125, -12.62646484375, -12.2069091796875, -11.787353515625, -11.3677978515625, -10.9482421875, -10.5286865234375, -10.109130859375, -9.6895751953125, -9.27001953125, -8.8504638671875, -8.430908203125, -8.0113525390625, -7.591796875, -7.1722412109375, -6.752685546875, -6.3331298828125, -5.91357421875, -5.4940185546875, -5.074462890625, -4.6549072265625, -4.2353515625, -3.8157958984375, -3.396240234375, -2.9766845703125, -2.55712890625, -2.1375732421875, -1.718017578125, -1.2984619140625, -0.87890625, -0.4593505859375, -0.039794921875, 0.3797607421875, 0.79931640625, 1.2188720703125, 1.638427734375, 2.0579833984375, 2.4775390625, 2.8970947265625, 3.316650390625, 3.7362060546875, 4.15576171875, 4.5753173828125, 4.994873046875, 5.4144287109375, 5.833984375, 6.2535400390625, 6.673095703125, 7.0926513671875, 7.51220703125, 7.9317626953125, 8.351318359375, 8.7708740234375, 9.1904296875, 9.6099853515625, 10.029541015625, 10.4490966796875, 10.86865234375, 11.2882080078125, 11.707763671875, 12.1273193359375, 12.546875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 8.0, 12.0, 14.0, 22.0, 36.0, 55.0, 93.0, 143.0, 189.0, 289.0, 476.0, 678.0, 977.0, 1614.0, 2227.0, 3392.0, 4804.0, 7233.0, 10558.0, 15960.0, 23236.0, 34317.0, 50826.0, 72738.0, 101788.0, 132826.0, 147324.0, 127019.0, 95486.0, 68095.0, 47129.0, 32065.0, 21441.0, 14646.0, 10020.0, 6786.0, 4592.0, 3025.0, 2039.0, 1482.0, 1009.0, 607.0, 422.0, 271.0, 204.0, 130.0, 75.0, 66.0, 40.0, 29.0, 20.0, 11.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.69384765625, -0.6710281372070312, -0.6482086181640625, -0.6253890991210938, -0.602569580078125, -0.5797500610351562, -0.5569305419921875, -0.5341110229492188, -0.51129150390625, -0.48847198486328125, -0.4656524658203125, -0.44283294677734375, -0.420013427734375, -0.39719390869140625, -0.3743743896484375, -0.35155487060546875, -0.3287353515625, -0.30591583251953125, -0.2830963134765625, -0.26027679443359375, -0.237457275390625, -0.21463775634765625, -0.1918182373046875, -0.16899871826171875, -0.14617919921875, -0.12335968017578125, -0.1005401611328125, -0.07772064208984375, -0.054901123046875, -0.03208160400390625, -0.0092620849609375, 0.01355743408203125, 0.036376953125, 0.05919647216796875, 0.0820159912109375, 0.10483551025390625, 0.127655029296875, 0.15047454833984375, 0.1732940673828125, 0.19611358642578125, 0.21893310546875, 0.24175262451171875, 0.2645721435546875, 0.28739166259765625, 0.310211181640625, 0.33303070068359375, 0.3558502197265625, 0.37866973876953125, 0.4014892578125, 0.42430877685546875, 0.4471282958984375, 0.46994781494140625, 0.492767333984375, 0.5155868530273438, 0.5384063720703125, 0.5612258911132812, 0.58404541015625, 0.6068649291992188, 0.6296844482421875, 0.6525039672851562, 0.675323486328125, 0.6981430053710938, 0.7209625244140625, 0.7437820434570312, 0.7666015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 2.0, 4.0, 3.0, 6.0, 9.0, 9.0, 12.0, 7.0, 23.0, 15.0, 19.0, 20.0, 29.0, 28.0, 35.0, 40.0, 43.0, 44.0, 36.0, 43.0, 44.0, 1072.0, 51.0, 37.0, 35.0, 52.0, 33.0, 22.0, 36.0, 39.0, 30.0, 23.0, 20.0, 21.0, 20.0, 17.0, 15.0, 7.0, 3.0, 2.0, 7.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.6923828125, -7.423828125, -7.1552734375, -6.88671875, -6.6181640625, -6.349609375, -6.0810546875, -5.8125, -5.5439453125, -5.275390625, -5.0068359375, -4.73828125, -4.4697265625, -4.201171875, -3.9326171875, -3.6640625, -3.3955078125, -3.126953125, -2.8583984375, -2.58984375, -2.3212890625, -2.052734375, -1.7841796875, -1.515625, -1.2470703125, -0.978515625, -0.7099609375, -0.44140625, -0.1728515625, 0.095703125, 0.3642578125, 0.6328125, 0.9013671875, 1.169921875, 1.4384765625, 1.70703125, 1.9755859375, 2.244140625, 2.5126953125, 2.78125, 3.0498046875, 3.318359375, 3.5869140625, 3.85546875, 4.1240234375, 4.392578125, 4.6611328125, 4.9296875, 5.1982421875, 5.466796875, 5.7353515625, 6.00390625, 6.2724609375, 6.541015625, 6.8095703125, 7.078125, 7.3466796875, 7.615234375, 7.8837890625, 8.15234375, 8.4208984375, 8.689453125, 8.9580078125, 9.2265625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 10.0, 15.0, 12.0, 31.0, 34.0, 76.0, 107.0, 158.0, 313.0, 553.0, 888.0, 1378.0, 2584.0, 4313.0, 7326.0, 12462.0, 21470.0, 36500.0, 60343.0, 98316.0, 146438.0, 1202939.0, 188697.0, 120728.0, 77948.0, 46552.0, 27914.0, 16066.0, 9476.0, 5455.0, 3310.0, 1940.0, 1064.0, 681.0, 366.0, 241.0, 148.0, 82.0, 63.0, 36.0, 33.0, 19.0, 14.0, 11.0, 11.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.68115234375, -0.6582489013671875, -0.635345458984375, -0.6124420166015625, -0.58953857421875, -0.5666351318359375, -0.543731689453125, -0.5208282470703125, -0.4979248046875, -0.4750213623046875, -0.452117919921875, -0.4292144775390625, -0.40631103515625, -0.3834075927734375, -0.360504150390625, -0.3376007080078125, -0.314697265625, -0.2917938232421875, -0.268890380859375, -0.2459869384765625, -0.22308349609375, -0.2001800537109375, -0.177276611328125, -0.1543731689453125, -0.1314697265625, -0.1085662841796875, -0.085662841796875, -0.0627593994140625, -0.03985595703125, -0.0169525146484375, 0.005950927734375, 0.0288543701171875, 0.0517578125, 0.0746612548828125, 0.097564697265625, 0.1204681396484375, 0.14337158203125, 0.1662750244140625, 0.189178466796875, 0.2120819091796875, 0.2349853515625, 0.2578887939453125, 0.280792236328125, 0.3036956787109375, 0.32659912109375, 0.3495025634765625, 0.372406005859375, 0.3953094482421875, 0.418212890625, 0.4411163330078125, 0.464019775390625, 0.4869232177734375, 0.50982666015625, 0.5327301025390625, 0.555633544921875, 0.5785369873046875, 0.6014404296875, 0.6243438720703125, 0.647247314453125, 0.6701507568359375, 0.69305419921875, 0.7159576416015625, 0.738861083984375, 0.7617645263671875, 0.78466796875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 9.0, 6.0, 14.0, 17.0, 22.0, 17.0, 23.0, 25.0, 41.0, 45.0, 73.0, 59.0, 73.0, 84.0, 76.0, 73.0, 48.0, 50.0, 41.0, 35.0, 31.0, 26.0, 22.0, 17.0, 12.0, 6.0, 5.0, 7.0, 3.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025299072265625, -0.024567604064941406, -0.023836135864257812, -0.02310466766357422, -0.022373199462890625, -0.02164173126220703, -0.020910263061523438, -0.020178794860839844, -0.01944732666015625, -0.018715858459472656, -0.017984390258789062, -0.01725292205810547, -0.016521453857421875, -0.01578998565673828, -0.015058517456054688, -0.014327049255371094, -0.0135955810546875, -0.012864112854003906, -0.012132644653320312, -0.011401176452636719, -0.010669708251953125, -0.009938240051269531, -0.009206771850585938, -0.008475303649902344, -0.00774383544921875, -0.007012367248535156, -0.0062808990478515625, -0.005549430847167969, -0.004817962646484375, -0.004086494445800781, -0.0033550262451171875, -0.0026235580444335938, -0.00189208984375, -0.0011606216430664062, -0.0004291534423828125, 0.00030231475830078125, 0.001033782958984375, 0.0017652511596679688, 0.0024967193603515625, 0.0032281875610351562, 0.00395965576171875, 0.004691123962402344, 0.0054225921630859375, 0.006154060363769531, 0.006885528564453125, 0.007616996765136719, 0.008348464965820312, 0.009079933166503906, 0.0098114013671875, 0.010542869567871094, 0.011274337768554688, 0.012005805969238281, 0.012737274169921875, 0.013468742370605469, 0.014200210571289062, 0.014931678771972656, 0.01566314697265625, 0.016394615173339844, 0.017126083374023438, 0.01785755157470703, 0.018589019775390625, 0.01932048797607422, 0.020051956176757812, 0.020783424377441406, 0.021514892578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 14.0, 9.0, 16.0, 23.0, 15.0, 37.0, 41.0, 61.0, 88.0, 120.0, 170.0, 239.0, 430.0, 983.0, 64288.0, 978073.0, 2383.0, 592.0, 324.0, 155.0, 130.0, 77.0, 61.0, 38.0, 40.0, 24.0, 18.0, 21.0, 11.0, 9.0, 8.0, 2.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.383056640625, -0.3699455261230469, -0.35683441162109375, -0.3437232971191406, -0.3306121826171875, -0.3175010681152344, -0.30438995361328125, -0.2912788391113281, -0.278167724609375, -0.2650566101074219, -0.25194549560546875, -0.23883438110351562, -0.2257232666015625, -0.21261215209960938, -0.19950103759765625, -0.18638992309570312, -0.17327880859375, -0.16016769409179688, -0.14705657958984375, -0.13394546508789062, -0.1208343505859375, -0.10772323608398438, -0.09461212158203125, -0.08150100708007812, -0.068389892578125, -0.055278778076171875, -0.04216766357421875, -0.029056549072265625, -0.0159454345703125, -0.002834320068359375, 0.01027679443359375, 0.023387908935546875, 0.0364990234375, 0.049610137939453125, 0.06272125244140625, 0.07583236694335938, 0.0889434814453125, 0.10205459594726562, 0.11516571044921875, 0.12827682495117188, 0.141387939453125, 0.15449905395507812, 0.16761016845703125, 0.18072128295898438, 0.1938323974609375, 0.20694351196289062, 0.22005462646484375, 0.23316574096679688, 0.24627685546875, 0.2593879699707031, 0.27249908447265625, 0.2856101989746094, 0.2987213134765625, 0.3118324279785156, 0.32494354248046875, 0.3380546569824219, 0.351165771484375, 0.3642768859863281, 0.37738800048828125, 0.3904991149902344, 0.4036102294921875, 0.4167213439941406, 0.42983245849609375, 0.4429435729980469, 0.4560546875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 62.0, 265.0, 429.0, 195.0, 46.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07442733645439148, -0.0729195699095726, -0.07141180336475372, -0.06990403681993484, -0.06839627027511597, -0.06688850373029709, -0.06538073718547821, -0.06387297064065933, -0.06236520782113075, -0.060857441276311874, -0.059349674731492996, -0.05784190818667412, -0.05633414164185524, -0.05482637882232666, -0.05331861227750778, -0.051810845732688904, -0.050303079187870026, -0.04879531264305115, -0.04728754609823227, -0.04577977955341339, -0.04427201300859451, -0.042764246463775635, -0.04125647991895676, -0.03974871709942818, -0.038240946829319, -0.03673318028450012, -0.035225413739681244, -0.033717647194862366, -0.03220988065004349, -0.03070211596786976, -0.02919434942305088, -0.02768658474087715, -0.026178820058703423, -0.024671053513884544, -0.023163286969065666, -0.021655522286891937, -0.02014775574207306, -0.01863998919725418, -0.017132222652435303, -0.015624457038939, -0.014116690494120121, -0.012608923949301243, -0.01110115833580494, -0.009593391790986061, -0.008085625246167183, -0.006577859632670879, -0.005070093087852001, -0.0035623274743556976, -0.0020545609295368195, -0.0005467947339639068, 0.0009609714616090059, 0.0024687377735972404, 0.003976503852754831, 0.005484269931912422, 0.0069920364767313, 0.008499802090227604, 0.010007568635046482, 0.01151533517986536, 0.013023100793361664, 0.014530867338180542, 0.01603863388299942, 0.0175464004278183, 0.019054166972637177, 0.020561931654810905, 0.022069698199629784]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 10.0, 6.0, 14.0, 6.0, 15.0, 18.0, 13.0, 19.0, 18.0, 28.0, 28.0, 27.0, 31.0, 35.0, 26.0, 42.0, 40.0, 44.0, 44.0, 46.0, 56.0, 39.0, 33.0, 35.0, 36.0, 37.0, 33.0, 29.0, 34.0, 22.0, 16.0, 15.0, 21.0, 17.0, 12.0, 7.0, 6.0, 9.0, 7.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010846078395843506, -0.010490799322724342, -0.010135520249605179, -0.009780241176486015, -0.009424962103366852, -0.009069683030247688, -0.008714403957128525, -0.008359124884009361, -0.008003845810890198, -0.007648566737771034, -0.007293287664651871, -0.006938008591532707, -0.006582729518413544, -0.00622745044529438, -0.005872171372175217, -0.005516892299056053, -0.00516161322593689, -0.004806334152817726, -0.004451055079698563, -0.004095776006579399, -0.0037404969334602356, -0.003385217860341072, -0.0030299387872219086, -0.002674659714102745, -0.0023193806409835815, -0.001964101567864418, -0.0016088224947452545, -0.001253543421626091, -0.0008982643485069275, -0.000542985275387764, -0.00018770620226860046, 0.00016757287085056305, 0.0005228519439697266, 0.0008781310170888901, 0.0012334100902080536, 0.001588689163327217, 0.0019439682364463806, 0.002299247309565544, 0.0026545263826847076, 0.003009805455803871, 0.0033650845289230347, 0.003720363602042198, 0.004075642675161362, 0.004430921748280525, 0.004786200821399689, 0.005141479894518852, 0.005496758967638016, 0.005852038040757179, 0.006207317113876343, 0.006562596186995506, 0.00691787526011467, 0.007273154333233833, 0.007628433406352997, 0.00798371247947216, 0.008338991552591324, 0.008694270625710487, 0.009049549698829651, 0.009404828771948814, 0.009760107845067978, 0.010115386918187141, 0.010470665991306305, 0.010825945064425468, 0.011181224137544632, 0.011536503210663795, 0.011891782283782959]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 9.0, 20.0, 16.0, 16.0, 27.0, 18.0, 35.0, 37.0, 31.0, 32.0, 36.0, 39.0, 48.0, 39.0, 40.0, 49.0, 49.0, 56.0, 42.0, 44.0, 30.0, 37.0, 26.0, 30.0, 25.0, 25.0, 23.0, 21.0, 11.0, 11.0, 16.0, 6.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.88525390625, -13.4658203125, -13.04638671875, -12.626953125, -12.20751953125, -11.7880859375, -11.36865234375, -10.94921875, -10.52978515625, -10.1103515625, -9.69091796875, -9.271484375, -8.85205078125, -8.4326171875, -8.01318359375, -7.59375, -7.17431640625, -6.7548828125, -6.33544921875, -5.916015625, -5.49658203125, -5.0771484375, -4.65771484375, -4.23828125, -3.81884765625, -3.3994140625, -2.97998046875, -2.560546875, -2.14111328125, -1.7216796875, -1.30224609375, -0.8828125, -0.46337890625, -0.0439453125, 0.37548828125, 0.794921875, 1.21435546875, 1.6337890625, 2.05322265625, 2.47265625, 2.89208984375, 3.3115234375, 3.73095703125, 4.150390625, 4.56982421875, 4.9892578125, 5.40869140625, 5.828125, 6.24755859375, 6.6669921875, 7.08642578125, 7.505859375, 7.92529296875, 8.3447265625, 8.76416015625, 9.18359375, 9.60302734375, 10.0224609375, 10.44189453125, 10.861328125, 11.28076171875, 11.7001953125, 12.11962890625, 12.5390625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 11.0, 12.0, 13.0, 24.0, 31.0, 40.0, 61.0, 76.0, 88.0, 131.0, 170.0, 241.0, 325.0, 414.0, 566.0, 769.0, 1108.0, 1765.0, 3329.0, 8623.0, 32425.0, 146019.0, 516007.0, 254557.0, 56636.0, 13814.0, 4524.0, 2110.0, 1320.0, 840.0, 635.0, 462.0, 344.0, 281.0, 208.0, 150.0, 103.0, 81.0, 68.0, 44.0, 34.0, 18.0, 18.0, 19.0, 10.0, 10.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-22.296875, -21.61474609375, -20.9326171875, -20.25048828125, -19.568359375, -18.88623046875, -18.2041015625, -17.52197265625, -16.83984375, -16.15771484375, -15.4755859375, -14.79345703125, -14.111328125, -13.42919921875, -12.7470703125, -12.06494140625, -11.3828125, -10.70068359375, -10.0185546875, -9.33642578125, -8.654296875, -7.97216796875, -7.2900390625, -6.60791015625, -5.92578125, -5.24365234375, -4.5615234375, -3.87939453125, -3.197265625, -2.51513671875, -1.8330078125, -1.15087890625, -0.46875, 0.21337890625, 0.8955078125, 1.57763671875, 2.259765625, 2.94189453125, 3.6240234375, 4.30615234375, 4.98828125, 5.67041015625, 6.3525390625, 7.03466796875, 7.716796875, 8.39892578125, 9.0810546875, 9.76318359375, 10.4453125, 11.12744140625, 11.8095703125, 12.49169921875, 13.173828125, 13.85595703125, 14.5380859375, 15.22021484375, 15.90234375, 16.58447265625, 17.2666015625, 17.94873046875, 18.630859375, 19.31298828125, 19.9951171875, 20.67724609375, 21.359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 2.0, 10.0, 11.0, 11.0, 19.0, 13.0, 17.0, 27.0, 30.0, 33.0, 40.0, 49.0, 56.0, 51.0, 125.0, 474.0, 1517.0, 138.0, 67.0, 57.0, 53.0, 40.0, 42.0, 33.0, 28.0, 17.0, 16.0, 13.0, 11.0, 3.0, 10.0, 3.0, 11.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-40.4375, -39.28369140625, -38.1298828125, -36.97607421875, -35.822265625, -34.66845703125, -33.5146484375, -32.36083984375, -31.20703125, -30.05322265625, -28.8994140625, -27.74560546875, -26.591796875, -25.43798828125, -24.2841796875, -23.13037109375, -21.9765625, -20.82275390625, -19.6689453125, -18.51513671875, -17.361328125, -16.20751953125, -15.0537109375, -13.89990234375, -12.74609375, -11.59228515625, -10.4384765625, -9.28466796875, -8.130859375, -6.97705078125, -5.8232421875, -4.66943359375, -3.515625, -2.36181640625, -1.2080078125, -0.05419921875, 1.099609375, 2.25341796875, 3.4072265625, 4.56103515625, 5.71484375, 6.86865234375, 8.0224609375, 9.17626953125, 10.330078125, 11.48388671875, 12.6376953125, 13.79150390625, 14.9453125, 16.09912109375, 17.2529296875, 18.40673828125, 19.560546875, 20.71435546875, 21.8681640625, 23.02197265625, 24.17578125, 25.32958984375, 26.4833984375, 27.63720703125, 28.791015625, 29.94482421875, 31.0986328125, 32.25244140625, 33.40625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 12.0, 11.0, 20.0, 13.0, 23.0, 24.0, 55.0, 50.0, 90.0, 180.0, 305.0, 602.0, 1896.0, 2764949.0, 374669.0, 1497.0, 549.0, 251.0, 157.0, 87.0, 61.0, 38.0, 27.0, 21.0, 17.0, 20.0, 11.0, 10.0, 5.0, 4.0, 3.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.5625, -107.7060546875, -103.849609375, -99.9931640625, -96.13671875, -92.2802734375, -88.423828125, -84.5673828125, -80.7109375, -76.8544921875, -72.998046875, -69.1416015625, -65.28515625, -61.4287109375, -57.572265625, -53.7158203125, -49.859375, -46.0029296875, -42.146484375, -38.2900390625, -34.43359375, -30.5771484375, -26.720703125, -22.8642578125, -19.0078125, -15.1513671875, -11.294921875, -7.4384765625, -3.58203125, 0.2744140625, 4.130859375, 7.9873046875, 11.84375, 15.7001953125, 19.556640625, 23.4130859375, 27.26953125, 31.1259765625, 34.982421875, 38.8388671875, 42.6953125, 46.5517578125, 50.408203125, 54.2646484375, 58.12109375, 61.9775390625, 65.833984375, 69.6904296875, 73.546875, 77.4033203125, 81.259765625, 85.1162109375, 88.97265625, 92.8291015625, 96.685546875, 100.5419921875, 104.3984375, 108.2548828125, 112.111328125, 115.9677734375, 119.82421875, 123.6806640625, 127.537109375, 131.3935546875, 135.25]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 38.0, 145.0, 308.0, 335.0, 132.0, 44.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.91552734375, -149.25157165527344, -144.5876007080078, -139.92364501953125, -135.25967407226562, -130.59571838378906, -125.9317626953125, -121.2677993774414, -116.60383605957031, -111.93987274169922, -107.27590942382812, -102.61195373535156, -97.94799041748047, -93.28402709960938, -88.62007141113281, -83.95610809326172, -79.29214477539062, -74.62818145751953, -69.96421813964844, -65.30026245117188, -60.63629913330078, -55.97233581542969, -51.30837631225586, -46.64441680908203, -41.98045349121094, -37.316490173339844, -32.652530670166016, -27.988569259643555, -23.324607849121094, -18.660646438598633, -13.996685028076172, -9.332725524902344, -4.6687774658203125, -0.0048160552978515625, 4.659145355224609, 9.32310676574707, 13.987068176269531, 18.651029586791992, 23.314990997314453, 27.97895050048828, 32.642913818359375, 37.30687713623047, 41.9708366394043, 46.634796142578125, 51.29875946044922, 55.96272277832031, 60.62668228149414, 65.29064178466797, 69.95460510253906, 74.61856842041016, 79.28253173828125, 83.94648742675781, 88.6104507446289, 93.2744140625, 97.93836975097656, 102.60233306884766, 107.26629638671875, 111.93025970458984, 116.59422302246094, 121.2581787109375, 125.9221420288086, 130.5861053466797, 135.25006103515625, 139.91403198242188, 144.57798767089844]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 8.0, 7.0, 4.0, 9.0, 9.0, 11.0, 12.0, 18.0, 22.0, 13.0, 25.0, 24.0, 30.0, 33.0, 41.0, 38.0, 32.0, 47.0, 57.0, 50.0, 51.0, 39.0, 41.0, 29.0, 30.0, 36.0, 33.0, 35.0, 31.0, 29.0, 27.0, 16.0, 24.0, 14.0, 12.0, 9.0, 10.0, 10.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.78633117675781, -79.10333251953125, -76.42033386230469, -73.7373275756836, -71.05432891845703, -68.37133026123047, -65.68832397460938, -63.00532531738281, -60.32232666015625, -57.63932800292969, -54.95632553100586, -52.27332305908203, -49.59032440185547, -46.907325744628906, -44.22432327270508, -41.54132080078125, -38.85832214355469, -36.175323486328125, -33.4923210144043, -30.8093204498291, -28.126319885253906, -25.44331932067871, -22.760318756103516, -20.07731819152832, -17.394317626953125, -14.71131706237793, -12.028316497802734, -9.345315933227539, -6.662315368652344, -3.9793148040771484, -1.2963142395019531, 1.3866863250732422, 4.0696868896484375, 6.752687454223633, 9.435688018798828, 12.118688583374023, 14.801689147949219, 17.484689712524414, 20.16769027709961, 22.850690841674805, 25.53369140625, 28.216691970825195, 30.89969253540039, 33.58269500732422, 36.26569366455078, 38.948692321777344, 41.63169479370117, 44.314697265625, 46.99769592285156, 49.680694580078125, 52.36369705200195, 55.04669952392578, 57.729698181152344, 60.412696838378906, 63.095699310302734, 65.77870178222656, 68.46170043945312, 71.14469909667969, 73.82769775390625, 76.51070404052734, 79.1937026977539, 81.87670135498047, 84.55970764160156, 87.24270629882812, 89.92570495605469]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 11.0, 11.0, 14.0, 10.0, 18.0, 23.0, 33.0, 20.0, 33.0, 34.0, 37.0, 32.0, 37.0, 49.0, 43.0, 32.0, 41.0, 49.0, 51.0, 58.0, 42.0, 40.0, 39.0, 33.0, 23.0, 26.0, 26.0, 25.0, 20.0, 16.0, 13.0, 9.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.046875, -13.6156005859375, -13.184326171875, -12.7530517578125, -12.32177734375, -11.8905029296875, -11.459228515625, -11.0279541015625, -10.5966796875, -10.1654052734375, -9.734130859375, -9.3028564453125, -8.87158203125, -8.4403076171875, -8.009033203125, -7.5777587890625, -7.146484375, -6.7152099609375, -6.283935546875, -5.8526611328125, -5.42138671875, -4.9901123046875, -4.558837890625, -4.1275634765625, -3.6962890625, -3.2650146484375, -2.833740234375, -2.4024658203125, -1.97119140625, -1.5399169921875, -1.108642578125, -0.6773681640625, -0.24609375, 0.1851806640625, 0.616455078125, 1.0477294921875, 1.47900390625, 1.9102783203125, 2.341552734375, 2.7728271484375, 3.2041015625, 3.6353759765625, 4.066650390625, 4.4979248046875, 4.92919921875, 5.3604736328125, 5.791748046875, 6.2230224609375, 6.654296875, 7.0855712890625, 7.516845703125, 7.9481201171875, 8.37939453125, 8.8106689453125, 9.241943359375, 9.6732177734375, 10.1044921875, 10.5357666015625, 10.967041015625, 11.3983154296875, 11.82958984375, 12.2608642578125, 12.692138671875, 13.1234130859375, 13.5546875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 7.0, 11.0, 6.0, 7.0, 20.0, 21.0, 18.0, 23.0, 43.0, 44.0, 49.0, 78.0, 113.0, 182.0, 291.0, 434.0, 679.0, 1371.0, 2460.0, 5207.0, 13236.0, 44537.0, 225093.0, 1164540.0, 1992854.0, 594021.0, 107458.0, 24727.0, 8398.0, 3757.0, 1861.0, 993.0, 601.0, 359.0, 242.0, 122.0, 113.0, 65.0, 50.0, 40.0, 35.0, 34.0, 17.0, 14.0, 14.0, 11.0, 7.0, 5.0, 9.0, 3.0, 0.0, 4.0, 0.0, 3.0], "bins": [-21.859375, -21.2216796875, -20.583984375, -19.9462890625, -19.30859375, -18.6708984375, -18.033203125, -17.3955078125, -16.7578125, -16.1201171875, -15.482421875, -14.8447265625, -14.20703125, -13.5693359375, -12.931640625, -12.2939453125, -11.65625, -11.0185546875, -10.380859375, -9.7431640625, -9.10546875, -8.4677734375, -7.830078125, -7.1923828125, -6.5546875, -5.9169921875, -5.279296875, -4.6416015625, -4.00390625, -3.3662109375, -2.728515625, -2.0908203125, -1.453125, -0.8154296875, -0.177734375, 0.4599609375, 1.09765625, 1.7353515625, 2.373046875, 3.0107421875, 3.6484375, 4.2861328125, 4.923828125, 5.5615234375, 6.19921875, 6.8369140625, 7.474609375, 8.1123046875, 8.75, 9.3876953125, 10.025390625, 10.6630859375, 11.30078125, 11.9384765625, 12.576171875, 13.2138671875, 13.8515625, 14.4892578125, 15.126953125, 15.7646484375, 16.40234375, 17.0400390625, 17.677734375, 18.3154296875, 18.953125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 5.0, 3.0, 10.0, 8.0, 4.0, 7.0, 16.0, 15.0, 27.0, 36.0, 33.0, 49.0, 59.0, 72.0, 109.0, 123.0, 137.0, 166.0, 237.0, 297.0, 405.0, 428.0, 371.0, 328.0, 238.0, 190.0, 117.0, 112.0, 108.0, 74.0, 52.0, 47.0, 56.0, 25.0, 19.0, 22.0, 18.0, 11.0, 7.0, 5.0, 4.0, 8.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.984375, -18.4488525390625, -17.913330078125, -17.3778076171875, -16.84228515625, -16.3067626953125, -15.771240234375, -15.2357177734375, -14.7001953125, -14.1646728515625, -13.629150390625, -13.0936279296875, -12.55810546875, -12.0225830078125, -11.487060546875, -10.9515380859375, -10.416015625, -9.8804931640625, -9.344970703125, -8.8094482421875, -8.27392578125, -7.7384033203125, -7.202880859375, -6.6673583984375, -6.1318359375, -5.5963134765625, -5.060791015625, -4.5252685546875, -3.98974609375, -3.4542236328125, -2.918701171875, -2.3831787109375, -1.84765625, -1.3121337890625, -0.776611328125, -0.2410888671875, 0.29443359375, 0.8299560546875, 1.365478515625, 1.9010009765625, 2.4365234375, 2.9720458984375, 3.507568359375, 4.0430908203125, 4.57861328125, 5.1141357421875, 5.649658203125, 6.1851806640625, 6.720703125, 7.2562255859375, 7.791748046875, 8.3272705078125, 8.86279296875, 9.3983154296875, 9.933837890625, 10.4693603515625, 11.0048828125, 11.5404052734375, 12.075927734375, 12.6114501953125, 13.14697265625, 13.6824951171875, 14.218017578125, 14.7535400390625, 15.2890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 16.0, 16.0, 26.0, 41.0, 65.0, 87.0, 134.0, 220.0, 383.0, 723.0, 1525.0, 4363.0, 22707.0, 236766.0, 3012930.0, 839000.0, 62167.0, 8438.0, 2376.0, 1040.0, 470.0, 251.0, 152.0, 134.0, 73.0, 55.0, 30.0, 18.0, 16.0, 12.0, 13.0, 9.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.03125, -40.85498046875, -39.6787109375, -38.50244140625, -37.326171875, -36.14990234375, -34.9736328125, -33.79736328125, -32.62109375, -31.44482421875, -30.2685546875, -29.09228515625, -27.916015625, -26.73974609375, -25.5634765625, -24.38720703125, -23.2109375, -22.03466796875, -20.8583984375, -19.68212890625, -18.505859375, -17.32958984375, -16.1533203125, -14.97705078125, -13.80078125, -12.62451171875, -11.4482421875, -10.27197265625, -9.095703125, -7.91943359375, -6.7431640625, -5.56689453125, -4.390625, -3.21435546875, -2.0380859375, -0.86181640625, 0.314453125, 1.49072265625, 2.6669921875, 3.84326171875, 5.01953125, 6.19580078125, 7.3720703125, 8.54833984375, 9.724609375, 10.90087890625, 12.0771484375, 13.25341796875, 14.4296875, 15.60595703125, 16.7822265625, 17.95849609375, 19.134765625, 20.31103515625, 21.4873046875, 22.66357421875, 23.83984375, 25.01611328125, 26.1923828125, 27.36865234375, 28.544921875, 29.72119140625, 30.8974609375, 32.07373046875, 33.25]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 133.0, 511.0, 320.0, 38.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.9436645507812, -650.0341186523438, -636.1245727539062, -622.215087890625, -608.3055419921875, -594.39599609375, -580.4864501953125, -566.576904296875, -552.6673583984375, -538.7578125, -524.8482666015625, -510.9387512207031, -497.0292053222656, -483.11968994140625, -469.21014404296875, -455.30059814453125, -441.3910827636719, -427.4815368652344, -413.572021484375, -399.6624755859375, -385.7529296875, -371.8433837890625, -357.9338684082031, -344.0243225097656, -330.11480712890625, -316.20526123046875, -302.2957458496094, -288.3861999511719, -274.4766540527344, -260.567138671875, -246.6575927734375, -232.748046875, -218.83847045898438, -204.92893981933594, -191.01939392089844, -177.10986328125, -163.2003173828125, -149.29078674316406, -135.38125610351562, -121.47171783447266, -107.56217956542969, -93.65264129638672, -79.74310302734375, -65.83357238769531, -51.924034118652344, -38.014495849609375, -24.104965209960938, -10.195426940917969, 3.714111328125, 17.623647689819336, 31.533184051513672, 45.442718505859375, 59.352256774902344, 73.26179504394531, 87.17132568359375, 101.08086395263672, 114.99040222167969, 128.89993286132812, 142.80947875976562, 156.71900939941406, 170.6285400390625, 184.5380859375, 198.44761657714844, 212.35714721679688, 226.26669311523438]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 9.0, 1.0, 10.0, 10.0, 9.0, 11.0, 15.0, 10.0, 18.0, 26.0, 21.0, 22.0, 34.0, 31.0, 25.0, 37.0, 26.0, 38.0, 40.0, 52.0, 44.0, 39.0, 29.0, 34.0, 40.0, 40.0, 25.0, 28.0, 36.0, 24.0, 28.0, 23.0, 26.0, 15.0, 25.0, 12.0, 13.0, 14.0, 10.0, 12.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-70.35222625732422, -68.11717224121094, -65.88211059570312, -63.64705276489258, -61.41199493408203, -59.176937103271484, -56.94187927246094, -54.70682144165039, -52.471763610839844, -50.2367057800293, -48.00164794921875, -45.7665901184082, -43.531532287597656, -41.29647445678711, -39.06141662597656, -36.826358795166016, -34.59130096435547, -32.35624313354492, -30.121185302734375, -27.886127471923828, -25.65106964111328, -23.416011810302734, -21.180953979492188, -18.94589614868164, -16.710838317871094, -14.475780487060547, -12.24072265625, -10.005664825439453, -7.770606994628906, -5.535549163818359, -3.3004913330078125, -1.0654335021972656, 1.16961669921875, 3.404674530029297, 5.639732360839844, 7.874790191650391, 10.109848022460938, 12.344905853271484, 14.579963684082031, 16.815021514892578, 19.050079345703125, 21.285137176513672, 23.52019500732422, 25.755252838134766, 27.990310668945312, 30.22536849975586, 32.460426330566406, 34.69548416137695, 36.9305419921875, 39.16559982299805, 41.400657653808594, 43.63571548461914, 45.87077331542969, 48.105831146240234, 50.34088897705078, 52.57594680786133, 54.811004638671875, 57.04606246948242, 59.28112030029297, 61.516178131103516, 63.75123596191406, 65.98629760742188, 68.22135162353516, 70.45640563964844, 72.69146728515625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 11.0, 6.0, 14.0, 5.0, 11.0, 17.0, 11.0, 12.0, 20.0, 16.0, 29.0, 22.0, 35.0, 32.0, 38.0, 40.0, 27.0, 40.0, 39.0, 43.0, 42.0, 43.0, 47.0, 33.0, 38.0, 33.0, 33.0, 50.0, 24.0, 26.0, 24.0, 24.0, 16.0, 17.0, 16.0, 11.0, 13.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.1484375, -9.8455810546875, -9.542724609375, -9.2398681640625, -8.93701171875, -8.6341552734375, -8.331298828125, -8.0284423828125, -7.7255859375, -7.4227294921875, -7.119873046875, -6.8170166015625, -6.51416015625, -6.2113037109375, -5.908447265625, -5.6055908203125, -5.302734375, -4.9998779296875, -4.697021484375, -4.3941650390625, -4.09130859375, -3.7884521484375, -3.485595703125, -3.1827392578125, -2.8798828125, -2.5770263671875, -2.274169921875, -1.9713134765625, -1.66845703125, -1.3656005859375, -1.062744140625, -0.7598876953125, -0.45703125, -0.1541748046875, 0.148681640625, 0.4515380859375, 0.75439453125, 1.0572509765625, 1.360107421875, 1.6629638671875, 1.9658203125, 2.2686767578125, 2.571533203125, 2.8743896484375, 3.17724609375, 3.4801025390625, 3.782958984375, 4.0858154296875, 4.388671875, 4.6915283203125, 4.994384765625, 5.2972412109375, 5.60009765625, 5.9029541015625, 6.205810546875, 6.5086669921875, 6.8115234375, 7.1143798828125, 7.417236328125, 7.7200927734375, 8.02294921875, 8.3258056640625, 8.628662109375, 8.9315185546875, 9.234375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 12.0, 18.0, 17.0, 41.0, 63.0, 91.0, 123.0, 229.0, 329.0, 500.0, 832.0, 1240.0, 2051.0, 3318.0, 5622.0, 9364.0, 15534.0, 25984.0, 43913.0, 73218.0, 118270.0, 168825.0, 186316.0, 147945.0, 97566.0, 59219.0, 35046.0, 20976.0, 12575.0, 7562.0, 4531.0, 2738.0, 1663.0, 1035.0, 632.0, 397.0, 270.0, 183.0, 100.0, 70.0, 55.0, 27.0, 24.0, 14.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.783355712890625, -0.75909423828125, -0.734832763671875, -0.7105712890625, -0.686309814453125, -0.66204833984375, -0.637786865234375, -0.613525390625, -0.589263916015625, -0.56500244140625, -0.540740966796875, -0.5164794921875, -0.492218017578125, -0.46795654296875, -0.443695068359375, -0.41943359375, -0.395172119140625, -0.37091064453125, -0.346649169921875, -0.3223876953125, -0.298126220703125, -0.27386474609375, -0.249603271484375, -0.225341796875, -0.201080322265625, -0.17681884765625, -0.152557373046875, -0.1282958984375, -0.104034423828125, -0.07977294921875, -0.055511474609375, -0.03125, -0.006988525390625, 0.01727294921875, 0.041534423828125, 0.0657958984375, 0.090057373046875, 0.11431884765625, 0.138580322265625, 0.162841796875, 0.187103271484375, 0.21136474609375, 0.235626220703125, 0.2598876953125, 0.284149169921875, 0.30841064453125, 0.332672119140625, 0.35693359375, 0.381195068359375, 0.40545654296875, 0.429718017578125, 0.4539794921875, 0.478240966796875, 0.50250244140625, 0.526763916015625, 0.551025390625, 0.575286865234375, 0.59954833984375, 0.623809814453125, 0.6480712890625, 0.672332763671875, 0.69659423828125, 0.720855712890625, 0.7451171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 4.0, 8.0, 7.0, 12.0, 17.0, 9.0, 22.0, 17.0, 16.0, 36.0, 29.0, 37.0, 33.0, 42.0, 35.0, 42.0, 40.0, 38.0, 1064.0, 32.0, 45.0, 39.0, 32.0, 36.0, 35.0, 37.0, 38.0, 30.0, 21.0, 22.0, 19.0, 18.0, 15.0, 11.0, 16.0, 11.0, 9.0, 11.0, 6.0, 5.0, 1.0, 6.0, 3.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.9296875, -5.7373046875, -5.544921875, -5.3525390625, -5.16015625, -4.9677734375, -4.775390625, -4.5830078125, -4.390625, -4.1982421875, -4.005859375, -3.8134765625, -3.62109375, -3.4287109375, -3.236328125, -3.0439453125, -2.8515625, -2.6591796875, -2.466796875, -2.2744140625, -2.08203125, -1.8896484375, -1.697265625, -1.5048828125, -1.3125, -1.1201171875, -0.927734375, -0.7353515625, -0.54296875, -0.3505859375, -0.158203125, 0.0341796875, 0.2265625, 0.4189453125, 0.611328125, 0.8037109375, 0.99609375, 1.1884765625, 1.380859375, 1.5732421875, 1.765625, 1.9580078125, 2.150390625, 2.3427734375, 2.53515625, 2.7275390625, 2.919921875, 3.1123046875, 3.3046875, 3.4970703125, 3.689453125, 3.8818359375, 4.07421875, 4.2666015625, 4.458984375, 4.6513671875, 4.84375, 5.0361328125, 5.228515625, 5.4208984375, 5.61328125, 5.8056640625, 5.998046875, 6.1904296875, 6.3828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 11.0, 17.0, 24.0, 45.0, 60.0, 88.0, 120.0, 183.0, 309.0, 458.0, 713.0, 1047.0, 1655.0, 2676.0, 4100.0, 6243.0, 9916.0, 15255.0, 23512.0, 36129.0, 54729.0, 79889.0, 110487.0, 175419.0, 1147219.0, 131496.0, 96894.0, 68146.0, 45572.0, 30229.0, 19329.0, 12382.0, 7985.0, 5218.0, 3396.0, 2169.0, 1356.0, 965.0, 561.0, 384.0, 255.0, 191.0, 111.0, 73.0, 42.0, 18.0, 18.0, 17.0, 10.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.46875, -0.453765869140625, -0.43878173828125, -0.423797607421875, -0.4088134765625, -0.393829345703125, -0.37884521484375, -0.363861083984375, -0.348876953125, -0.333892822265625, -0.31890869140625, -0.303924560546875, -0.2889404296875, -0.273956298828125, -0.25897216796875, -0.243988037109375, -0.22900390625, -0.214019775390625, -0.19903564453125, -0.184051513671875, -0.1690673828125, -0.154083251953125, -0.13909912109375, -0.124114990234375, -0.109130859375, -0.094146728515625, -0.07916259765625, -0.064178466796875, -0.0491943359375, -0.034210205078125, -0.01922607421875, -0.004241943359375, 0.0107421875, 0.025726318359375, 0.04071044921875, 0.055694580078125, 0.0706787109375, 0.085662841796875, 0.10064697265625, 0.115631103515625, 0.130615234375, 0.145599365234375, 0.16058349609375, 0.175567626953125, 0.1905517578125, 0.205535888671875, 0.22052001953125, 0.235504150390625, 0.25048828125, 0.265472412109375, 0.28045654296875, 0.295440673828125, 0.3104248046875, 0.325408935546875, 0.34039306640625, 0.355377197265625, 0.370361328125, 0.385345458984375, 0.40032958984375, 0.415313720703125, 0.4302978515625, 0.445281982421875, 0.46026611328125, 0.475250244140625, 0.490234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 7.0, 7.0, 13.0, 8.0, 11.0, 21.0, 23.0, 26.0, 34.0, 44.0, 67.0, 93.0, 138.0, 119.0, 97.0, 81.0, 40.0, 34.0, 18.0, 24.0, 15.0, 8.0, 8.0, 8.0, 3.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0242767333984375, -0.0236358642578125, -0.0229949951171875, -0.0223541259765625, -0.0217132568359375, -0.0210723876953125, -0.0204315185546875, -0.0197906494140625, -0.0191497802734375, -0.0185089111328125, -0.0178680419921875, -0.0172271728515625, -0.0165863037109375, -0.0159454345703125, -0.0153045654296875, -0.0146636962890625, -0.0140228271484375, -0.0133819580078125, -0.0127410888671875, -0.0121002197265625, -0.0114593505859375, -0.0108184814453125, -0.0101776123046875, -0.0095367431640625, -0.0088958740234375, -0.0082550048828125, -0.0076141357421875, -0.0069732666015625, -0.0063323974609375, -0.0056915283203125, -0.0050506591796875, -0.0044097900390625, -0.0037689208984375, -0.0031280517578125, -0.0024871826171875, -0.0018463134765625, -0.0012054443359375, -0.0005645751953125, 7.62939453125e-05, 0.0007171630859375, 0.0013580322265625, 0.0019989013671875, 0.0026397705078125, 0.0032806396484375, 0.0039215087890625, 0.0045623779296875, 0.0052032470703125, 0.0058441162109375, 0.0064849853515625, 0.0071258544921875, 0.0077667236328125, 0.0084075927734375, 0.0090484619140625, 0.0096893310546875, 0.0103302001953125, 0.0109710693359375, 0.0116119384765625, 0.0122528076171875, 0.0128936767578125, 0.0135345458984375, 0.0141754150390625, 0.0148162841796875, 0.0154571533203125, 0.0160980224609375, 0.0167388916015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 3.0, 11.0, 19.0, 20.0, 7.0, 21.0, 23.0, 21.0, 39.0, 68.0, 73.0, 105.0, 180.0, 332.0, 722.0, 11822.0, 1028823.0, 4686.0, 608.0, 286.0, 178.0, 105.0, 91.0, 64.0, 47.0, 32.0, 28.0, 27.0, 13.0, 14.0, 11.0, 9.0, 5.0, 7.0, 3.0, 4.0, 5.0, 3.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.28466796875, -0.273895263671875, -0.26312255859375, -0.252349853515625, -0.2415771484375, -0.230804443359375, -0.22003173828125, -0.209259033203125, -0.198486328125, -0.187713623046875, -0.17694091796875, -0.166168212890625, -0.1553955078125, -0.144622802734375, -0.13385009765625, -0.123077392578125, -0.1123046875, -0.101531982421875, -0.09075927734375, -0.079986572265625, -0.0692138671875, -0.058441162109375, -0.04766845703125, -0.036895751953125, -0.026123046875, -0.015350341796875, -0.00457763671875, 0.006195068359375, 0.0169677734375, 0.027740478515625, 0.03851318359375, 0.049285888671875, 0.06005859375, 0.070831298828125, 0.08160400390625, 0.092376708984375, 0.1031494140625, 0.113922119140625, 0.12469482421875, 0.135467529296875, 0.146240234375, 0.157012939453125, 0.16778564453125, 0.178558349609375, 0.1893310546875, 0.200103759765625, 0.21087646484375, 0.221649169921875, 0.232421875, 0.243194580078125, 0.25396728515625, 0.264739990234375, 0.2755126953125, 0.286285400390625, 0.29705810546875, 0.307830810546875, 0.318603515625, 0.329376220703125, 0.34014892578125, 0.350921630859375, 0.3616943359375, 0.372467041015625, 0.38323974609375, 0.394012451171875, 0.40478515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 491.0, 517.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03625253587961197, -0.031077347695827484, -0.025902159512043, -0.020726971328258514, -0.01555178314447403, -0.010376594960689545, -0.00520140677690506, -2.621859312057495e-05, 0.00514896959066391, 0.010324157774448395, 0.01549934595823288, 0.020674534142017365, 0.02584972232580185, 0.031024910509586334, 0.03620009869337082, 0.041375286877155304, 0.04655047506093979, 0.051725663244724274, 0.05690085142850876, 0.06207603961229324, 0.06725122779607773, 0.07242641597986221, 0.0776016041636467, 0.08277679234743118, 0.08795198053121567, 0.09312716871500015, 0.09830235689878464, 0.10347754508256912, 0.10865273326635361, 0.11382792145013809, 0.11900310963392258, 0.12417829781770706, 0.12935349345207214, 0.13452868163585663, 0.1397038698196411, 0.1448790580034256, 0.15005424618721008, 0.15522943437099457, 0.16040462255477905, 0.16557981073856354, 0.17075499892234802, 0.1759301871061325, 0.181105375289917, 0.18628056347370148, 0.19145575165748596, 0.19663093984127045, 0.20180612802505493, 0.20698131620883942, 0.2121565043926239, 0.2173316925764084, 0.22250688076019287, 0.22768206894397736, 0.23285725712776184, 0.23803244531154633, 0.2432076334953308, 0.2483828216791153, 0.2535580098628998, 0.25873321294784546, 0.26390838623046875, 0.26908355951309204, 0.2742587625980377, 0.2794339656829834, 0.2846091389656067, 0.28978431224823, 0.29495951533317566]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 3.0, 8.0, 20.0, 13.0, 14.0, 18.0, 22.0, 38.0, 45.0, 46.0, 40.0, 48.0, 60.0, 57.0, 66.0, 68.0, 48.0, 60.0, 42.0, 45.0, 32.0, 52.0, 32.0, 31.0, 18.0, 16.0, 13.0, 14.0, 10.0, 4.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.018145620822906494, -0.01770263910293579, -0.017259659245610237, -0.016816679388284683, -0.01637369766831398, -0.015930715948343277, -0.015487736091017723, -0.015044755302369595, -0.014601774513721466, -0.014158793725073338, -0.013715812936425209, -0.01327283214777708, -0.012829851359128952, -0.012386870570480824, -0.011943889781832695, -0.011500908993184566, -0.011057928204536438, -0.01061494741588831, -0.010171966627240181, -0.009728985838592052, -0.009286005049943924, -0.008843024261295795, -0.008400043472647667, -0.007957062683999538, -0.00751408189535141, -0.007071101106703281, -0.006628120318055153, -0.006185139529407024, -0.005742158740758896, -0.005299177952110767, -0.004856197163462639, -0.00441321637481451, -0.003970235586166382, -0.0035272547975182533, -0.003084274008870125, -0.0026412932202219963, -0.002198312431573868, -0.0017553316429257393, -0.0013123508542776108, -0.0008693700656294823, -0.00042638927698135376, 1.659151166677475e-05, 0.00045957230031490326, 0.0009025530889630318, 0.0013455338776111603, 0.0017885146662592888, 0.0022314954549074173, 0.002674476243555546, 0.0031174570322036743, 0.003560437820851803, 0.004003418609499931, 0.00444639939814806, 0.004889380186796188, 0.005332360975444317, 0.005775341764092445, 0.006218322552740574, 0.006661303341388702, 0.007104284130036831, 0.007547264918684959, 0.007990245707333088, 0.008433226495981216, 0.008876207284629345, 0.009319188073277473, 0.009762168861925602, 0.01020514965057373]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 11.0, 6.0, 14.0, 5.0, 11.0, 17.0, 11.0, 12.0, 20.0, 16.0, 29.0, 22.0, 35.0, 32.0, 38.0, 40.0, 27.0, 40.0, 39.0, 43.0, 41.0, 44.0, 47.0, 33.0, 38.0, 33.0, 33.0, 50.0, 24.0, 26.0, 24.0, 24.0, 16.0, 17.0, 16.0, 11.0, 13.0, 6.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.1484375, -9.8455810546875, -9.542724609375, -9.2398681640625, -8.93701171875, -8.6341552734375, -8.331298828125, -8.0284423828125, -7.7255859375, -7.4227294921875, -7.119873046875, -6.8170166015625, -6.51416015625, -6.2113037109375, -5.908447265625, -5.6055908203125, -5.302734375, -4.9998779296875, -4.697021484375, -4.3941650390625, -4.09130859375, -3.7884521484375, -3.485595703125, -3.1827392578125, -2.8798828125, -2.5770263671875, -2.274169921875, -1.9713134765625, -1.66845703125, -1.3656005859375, -1.062744140625, -0.7598876953125, -0.45703125, -0.1541748046875, 0.148681640625, 0.4515380859375, 0.75439453125, 1.0572509765625, 1.360107421875, 1.6629638671875, 1.9658203125, 2.2686767578125, 2.571533203125, 2.8743896484375, 3.17724609375, 3.4801025390625, 3.782958984375, 4.0858154296875, 4.388671875, 4.6915283203125, 4.994384765625, 5.2972412109375, 5.60009765625, 5.9029541015625, 6.205810546875, 6.5086669921875, 6.8115234375, 7.1143798828125, 7.417236328125, 7.7200927734375, 8.02294921875, 8.3258056640625, 8.628662109375, 8.9315185546875, 9.234375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 12.0, 10.0, 13.0, 14.0, 30.0, 35.0, 54.0, 69.0, 92.0, 116.0, 181.0, 208.0, 324.0, 462.0, 599.0, 873.0, 1351.0, 2220.0, 4027.0, 9173.0, 33588.0, 244075.0, 621341.0, 97281.0, 17598.0, 6159.0, 3077.0, 1707.0, 1136.0, 738.0, 504.0, 393.0, 304.0, 246.0, 128.0, 108.0, 68.0, 63.0, 39.0, 29.0, 31.0, 24.0, 15.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.625, -21.8779296875, -21.130859375, -20.3837890625, -19.63671875, -18.8896484375, -18.142578125, -17.3955078125, -16.6484375, -15.9013671875, -15.154296875, -14.4072265625, -13.66015625, -12.9130859375, -12.166015625, -11.4189453125, -10.671875, -9.9248046875, -9.177734375, -8.4306640625, -7.68359375, -6.9365234375, -6.189453125, -5.4423828125, -4.6953125, -3.9482421875, -3.201171875, -2.4541015625, -1.70703125, -0.9599609375, -0.212890625, 0.5341796875, 1.28125, 2.0283203125, 2.775390625, 3.5224609375, 4.26953125, 5.0166015625, 5.763671875, 6.5107421875, 7.2578125, 8.0048828125, 8.751953125, 9.4990234375, 10.24609375, 10.9931640625, 11.740234375, 12.4873046875, 13.234375, 13.9814453125, 14.728515625, 15.4755859375, 16.22265625, 16.9697265625, 17.716796875, 18.4638671875, 19.2109375, 19.9580078125, 20.705078125, 21.4521484375, 22.19921875, 22.9462890625, 23.693359375, 24.4404296875, 25.1875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 9.0, 12.0, 16.0, 24.0, 25.0, 19.0, 42.0, 43.0, 47.0, 74.0, 53.0, 111.0, 317.0, 1582.0, 162.0, 85.0, 65.0, 58.0, 46.0, 45.0, 30.0, 29.0, 31.0, 20.0, 17.0, 14.0, 16.0, 5.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.750244140625, -30.87548828125, -30.000732421875, -29.1259765625, -28.251220703125, -27.37646484375, -26.501708984375, -25.626953125, -24.752197265625, -23.87744140625, -23.002685546875, -22.1279296875, -21.253173828125, -20.37841796875, -19.503662109375, -18.62890625, -17.754150390625, -16.87939453125, -16.004638671875, -15.1298828125, -14.255126953125, -13.38037109375, -12.505615234375, -11.630859375, -10.756103515625, -9.88134765625, -9.006591796875, -8.1318359375, -7.257080078125, -6.38232421875, -5.507568359375, -4.6328125, -3.758056640625, -2.88330078125, -2.008544921875, -1.1337890625, -0.259033203125, 0.61572265625, 1.490478515625, 2.365234375, 3.239990234375, 4.11474609375, 4.989501953125, 5.8642578125, 6.739013671875, 7.61376953125, 8.488525390625, 9.36328125, 10.238037109375, 11.11279296875, 11.987548828125, 12.8623046875, 13.737060546875, 14.61181640625, 15.486572265625, 16.361328125, 17.236083984375, 18.11083984375, 18.985595703125, 19.8603515625, 20.735107421875, 21.60986328125, 22.484619140625, 23.359375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 8.0, 9.0, 3.0, 5.0, 15.0, 15.0, 19.0, 25.0, 43.0, 39.0, 56.0, 103.0, 138.0, 235.0, 328.0, 700.0, 1995.0, 641211.0, 2496677.0, 2282.0, 749.0, 364.0, 218.0, 136.0, 75.0, 76.0, 39.0, 31.0, 27.0, 20.0, 12.0, 14.0, 12.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.2041015625, -61.533203125, -58.8623046875, -56.19140625, -53.5205078125, -50.849609375, -48.1787109375, -45.5078125, -42.8369140625, -40.166015625, -37.4951171875, -34.82421875, -32.1533203125, -29.482421875, -26.8115234375, -24.140625, -21.4697265625, -18.798828125, -16.1279296875, -13.45703125, -10.7861328125, -8.115234375, -5.4443359375, -2.7734375, -0.1025390625, 2.568359375, 5.2392578125, 7.91015625, 10.5810546875, 13.251953125, 15.9228515625, 18.59375, 21.2646484375, 23.935546875, 26.6064453125, 29.27734375, 31.9482421875, 34.619140625, 37.2900390625, 39.9609375, 42.6318359375, 45.302734375, 47.9736328125, 50.64453125, 53.3154296875, 55.986328125, 58.6572265625, 61.328125, 63.9990234375, 66.669921875, 69.3408203125, 72.01171875, 74.6826171875, 77.353515625, 80.0244140625, 82.6953125, 85.3662109375, 88.037109375, 90.7080078125, 93.37890625, 96.0498046875, 98.720703125, 101.3916015625, 104.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 40.0, 159.0, 447.0, 276.0, 71.0, 11.0, 2.0, 0.0, 2.0], "bins": [-359.7062072753906, -353.4726257324219, -347.239013671875, -341.00543212890625, -334.7718200683594, -328.5382385253906, -322.30462646484375, -316.071044921875, -309.8374328613281, -303.6038513183594, -297.3702392578125, -291.13665771484375, -284.9030456542969, -278.6694641113281, -272.43585205078125, -266.2022705078125, -259.96868896484375, -253.73509216308594, -247.50149536132812, -241.2678985595703, -235.0343017578125, -228.8007049560547, -222.56710815429688, -216.33352661132812, -210.09991455078125, -203.86631774902344, -197.63272094726562, -191.3991241455078, -185.16552734375, -178.9319305419922, -172.69833374023438, -166.46475219726562, -160.2311248779297, -153.99752807617188, -147.76393127441406, -141.53033447265625, -135.29673767089844, -129.06314086914062, -122.82955169677734, -116.59595489501953, -110.36236572265625, -104.12876892089844, -97.89517211914062, -91.66157531738281, -85.427978515625, -79.19438171386719, -72.9607925415039, -66.7271957397461, -60.493595123291016, -54.2599983215332, -48.026405334472656, -41.792808532714844, -35.55921173095703, -29.32561492919922, -23.092021942138672, -16.85842514038086, -10.624828338623047, -4.391232490539551, 1.8423633575439453, 8.075958251953125, 14.309555053710938, 20.54315185546875, 26.776744842529297, 33.01034164428711, 39.24393844604492]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 7.0, 7.0, 9.0, 4.0, 13.0, 14.0, 19.0, 23.0, 25.0, 14.0, 23.0, 22.0, 33.0, 35.0, 29.0, 40.0, 36.0, 39.0, 48.0, 44.0, 29.0, 29.0, 44.0, 41.0, 34.0, 40.0, 32.0, 24.0, 34.0, 25.0, 26.0, 28.0, 23.0, 11.0, 14.0, 5.0, 8.0, 13.0, 10.0, 6.0, 4.0, 2.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-66.68267822265625, -64.56436157226562, -62.44605255126953, -60.32773971557617, -58.20942687988281, -56.09111022949219, -53.97279739379883, -51.85448455810547, -49.73617172241211, -47.61785888671875, -45.49954605102539, -43.38123321533203, -41.262916564941406, -39.14460754394531, -37.02629089355469, -34.90797805786133, -32.78966522216797, -30.67135238647461, -28.55303955078125, -26.434724807739258, -24.3164119720459, -22.19809913635254, -20.079784393310547, -17.961471557617188, -15.843158721923828, -13.724845886230469, -11.606532096862793, -9.488218307495117, -7.369905471801758, -5.251592636108398, -3.1332788467407227, -1.0149650573730469, 1.1033477783203125, 3.22166109085083, 5.339974403381348, 7.458287715911865, 9.576601028442383, 11.694913864135742, 13.813227653503418, 15.931541442871094, 18.049854278564453, 20.168167114257812, 22.286479949951172, 24.404794692993164, 26.523107528686523, 28.641420364379883, 30.759735107421875, 32.878047943115234, 34.996360778808594, 37.11467361450195, 39.23298645019531, 41.35129928588867, 43.46961212158203, 45.587928771972656, 47.706241607666016, 49.824554443359375, 51.942867279052734, 54.061180114746094, 56.17949295043945, 58.29780578613281, 60.41612243652344, 62.53443145751953, 64.65274810791016, 66.77105712890625, 68.88937377929688]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 7.0, 6.0, 11.0, 6.0, 10.0, 20.0, 18.0, 18.0, 13.0, 22.0, 25.0, 34.0, 23.0, 21.0, 30.0, 34.0, 29.0, 36.0, 39.0, 38.0, 36.0, 42.0, 56.0, 32.0, 40.0, 29.0, 38.0, 24.0, 32.0, 27.0, 30.0, 29.0, 23.0, 22.0, 13.0, 12.0, 12.0, 7.0, 7.0, 13.0, 7.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8402099609375, -8.524169921875, -8.2081298828125, -7.89208984375, -7.5760498046875, -7.260009765625, -6.9439697265625, -6.6279296875, -6.3118896484375, -5.995849609375, -5.6798095703125, -5.36376953125, -5.0477294921875, -4.731689453125, -4.4156494140625, -4.099609375, -3.7835693359375, -3.467529296875, -3.1514892578125, -2.83544921875, -2.5194091796875, -2.203369140625, -1.8873291015625, -1.5712890625, -1.2552490234375, -0.939208984375, -0.6231689453125, -0.30712890625, 0.0089111328125, 0.324951171875, 0.6409912109375, 0.95703125, 1.2730712890625, 1.589111328125, 1.9051513671875, 2.22119140625, 2.5372314453125, 2.853271484375, 3.1693115234375, 3.4853515625, 3.8013916015625, 4.117431640625, 4.4334716796875, 4.74951171875, 5.0655517578125, 5.381591796875, 5.6976318359375, 6.013671875, 6.3297119140625, 6.645751953125, 6.9617919921875, 7.27783203125, 7.5938720703125, 7.909912109375, 8.2259521484375, 8.5419921875, 8.8580322265625, 9.174072265625, 9.4901123046875, 9.80615234375, 10.1221923828125, 10.438232421875, 10.7542724609375, 11.0703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 9.0, 13.0, 25.0, 33.0, 57.0, 59.0, 113.0, 134.0, 204.0, 353.0, 485.0, 814.0, 1287.0, 2138.0, 3500.0, 6419.0, 13086.0, 34882.0, 156665.0, 808675.0, 1953086.0, 942385.0, 198667.0, 39769.0, 14530.0, 7033.0, 3825.0, 2229.0, 1319.0, 853.0, 524.0, 361.0, 235.0, 147.0, 100.0, 87.0, 52.0, 38.0, 21.0, 13.0, 15.0, 7.0, 8.0, 3.0, 0.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.208251953125, -12.72900390625, -12.249755859375, -11.7705078125, -11.291259765625, -10.81201171875, -10.332763671875, -9.853515625, -9.374267578125, -8.89501953125, -8.415771484375, -7.9365234375, -7.457275390625, -6.97802734375, -6.498779296875, -6.01953125, -5.540283203125, -5.06103515625, -4.581787109375, -4.1025390625, -3.623291015625, -3.14404296875, -2.664794921875, -2.185546875, -1.706298828125, -1.22705078125, -0.747802734375, -0.2685546875, 0.210693359375, 0.68994140625, 1.169189453125, 1.6484375, 2.127685546875, 2.60693359375, 3.086181640625, 3.5654296875, 4.044677734375, 4.52392578125, 5.003173828125, 5.482421875, 5.961669921875, 6.44091796875, 6.920166015625, 7.3994140625, 7.878662109375, 8.35791015625, 8.837158203125, 9.31640625, 9.795654296875, 10.27490234375, 10.754150390625, 11.2333984375, 11.712646484375, 12.19189453125, 12.671142578125, 13.150390625, 13.629638671875, 14.10888671875, 14.588134765625, 15.0673828125, 15.546630859375, 16.02587890625, 16.505126953125, 16.984375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 2.0, 4.0, 7.0, 15.0, 12.0, 26.0, 34.0, 41.0, 58.0, 97.0, 121.0, 178.0, 255.0, 354.0, 462.0, 601.0, 470.0, 411.0, 262.0, 199.0, 137.0, 96.0, 77.0, 50.0, 33.0, 25.0, 20.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.552490234375, -17.94873046875, -17.344970703125, -16.7412109375, -16.137451171875, -15.53369140625, -14.929931640625, -14.326171875, -13.722412109375, -13.11865234375, -12.514892578125, -11.9111328125, -11.307373046875, -10.70361328125, -10.099853515625, -9.49609375, -8.892333984375, -8.28857421875, -7.684814453125, -7.0810546875, -6.477294921875, -5.87353515625, -5.269775390625, -4.666015625, -4.062255859375, -3.45849609375, -2.854736328125, -2.2509765625, -1.647216796875, -1.04345703125, -0.439697265625, 0.1640625, 0.767822265625, 1.37158203125, 1.975341796875, 2.5791015625, 3.182861328125, 3.78662109375, 4.390380859375, 4.994140625, 5.597900390625, 6.20166015625, 6.805419921875, 7.4091796875, 8.012939453125, 8.61669921875, 9.220458984375, 9.82421875, 10.427978515625, 11.03173828125, 11.635498046875, 12.2392578125, 12.843017578125, 13.44677734375, 14.050537109375, 14.654296875, 15.258056640625, 15.86181640625, 16.465576171875, 17.0693359375, 17.673095703125, 18.27685546875, 18.880615234375, 19.484375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 8.0, 12.0, 17.0, 16.0, 19.0, 35.0, 49.0, 108.0, 166.0, 269.0, 467.0, 949.0, 2362.0, 13418.0, 645786.0, 3465996.0, 56864.0, 4602.0, 1479.0, 698.0, 355.0, 223.0, 107.0, 95.0, 56.0, 31.0, 30.0, 18.0, 11.0, 14.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.375, -41.01806640625, -39.6611328125, -38.30419921875, -36.947265625, -35.59033203125, -34.2333984375, -32.87646484375, -31.51953125, -30.16259765625, -28.8056640625, -27.44873046875, -26.091796875, -24.73486328125, -23.3779296875, -22.02099609375, -20.6640625, -19.30712890625, -17.9501953125, -16.59326171875, -15.236328125, -13.87939453125, -12.5224609375, -11.16552734375, -9.80859375, -8.45166015625, -7.0947265625, -5.73779296875, -4.380859375, -3.02392578125, -1.6669921875, -0.31005859375, 1.046875, 2.40380859375, 3.7607421875, 5.11767578125, 6.474609375, 7.83154296875, 9.1884765625, 10.54541015625, 11.90234375, 13.25927734375, 14.6162109375, 15.97314453125, 17.330078125, 18.68701171875, 20.0439453125, 21.40087890625, 22.7578125, 24.11474609375, 25.4716796875, 26.82861328125, 28.185546875, 29.54248046875, 30.8994140625, 32.25634765625, 33.61328125, 34.97021484375, 36.3271484375, 37.68408203125, 39.041015625, 40.39794921875, 41.7548828125, 43.11181640625, 44.46875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 6.0, 18.0, 24.0, 63.0, 83.0, 96.0, 126.0, 135.0, 141.0, 114.0, 78.0, 44.0, 39.0, 14.0, 12.0, 1.0, 8.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.60442352294922, -95.0711898803711, -92.5379638671875, -90.00473022460938, -87.47149658203125, -84.93826293945312, -82.405029296875, -79.8718032836914, -77.33856964111328, -74.80533599853516, -72.27210998535156, -69.73887634277344, -67.20564270019531, -64.67240905761719, -62.13917922973633, -59.60594940185547, -57.072715759277344, -54.53948211669922, -52.00625228881836, -49.4730224609375, -46.939788818359375, -44.40655517578125, -41.87332534790039, -39.34009552001953, -36.806861877441406, -34.27362823486328, -31.740398406982422, -29.20716667175293, -26.673934936523438, -24.140703201293945, -21.607471466064453, -19.07423973083496, -16.541000366210938, -14.007768630981445, -11.474536895751953, -8.941305160522461, -6.408073425292969, -3.8748416900634766, -1.3416099548339844, 1.1916217803955078, 3.724853515625, 6.258085250854492, 8.791316986083984, 11.324548721313477, 13.857780456542969, 16.39101219177246, 18.924243927001953, 21.457475662231445, 23.990707397460938, 26.52393913269043, 29.057170867919922, 31.590402603149414, 34.123634338378906, 36.65686798095703, 39.19009780883789, 41.72332763671875, 44.256561279296875, 46.789794921875, 49.32302474975586, 51.85625457763672, 54.389488220214844, 56.92272186279297, 59.45595169067383, 61.98918151855469, 64.52241516113281]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 12.0, 16.0, 15.0, 19.0, 18.0, 19.0, 16.0, 16.0, 18.0, 31.0, 21.0, 24.0, 35.0, 42.0, 43.0, 37.0, 27.0, 48.0, 32.0, 45.0, 41.0, 32.0, 31.0, 27.0, 35.0, 40.0, 30.0, 22.0, 24.0, 22.0, 19.0, 28.0, 22.0, 15.0, 7.0, 13.0, 9.0, 7.0, 7.0, 7.0, 7.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-59.865234375, -58.04966354370117, -56.23409652709961, -54.41852569580078, -52.60295486450195, -50.787384033203125, -48.97181701660156, -47.156246185302734, -45.340675354003906, -43.52510452270508, -41.709537506103516, -39.89396667480469, -38.07839584350586, -36.26282501220703, -34.44725799560547, -32.63168716430664, -30.816120147705078, -29.000551223754883, -27.184980392456055, -25.36941146850586, -23.55384063720703, -21.738271713256836, -19.92270278930664, -18.107131958007812, -16.291563034057617, -14.475993156433105, -12.660423278808594, -10.844854354858398, -9.029284477233887, -7.213714599609375, -5.39814567565918, -3.582575798034668, -1.7670059204101562, 0.04856371879577637, 1.864133358001709, 3.6797027587890625, 5.495272636413574, 7.310842514038086, 9.126411437988281, 10.941981315612793, 12.757551193237305, 14.573121070861816, 16.388690948486328, 18.204259872436523, 20.01982879638672, 21.835399627685547, 23.650968551635742, 25.466537475585938, 27.282108306884766, 29.09767723083496, 30.91324806213379, 32.728816986083984, 34.54438781738281, 36.359954833984375, 38.1755256652832, 39.99109649658203, 41.806663513183594, 43.62223434448242, 45.437801361083984, 47.25337219238281, 49.06894302368164, 50.88451385498047, 52.70008087158203, 54.51565170288086, 56.33122253417969]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 10.0, 18.0, 15.0, 19.0, 16.0, 23.0, 19.0, 26.0, 17.0, 35.0, 37.0, 36.0, 34.0, 47.0, 49.0, 48.0, 43.0, 50.0, 31.0, 35.0, 40.0, 31.0, 31.0, 29.0, 38.0, 30.0, 27.0, 13.0, 19.0, 17.0, 12.0, 15.0, 14.0, 7.0, 10.0, 3.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1328125, -7.8729248046875, -7.613037109375, -7.3531494140625, -7.09326171875, -6.8333740234375, -6.573486328125, -6.3135986328125, -6.0537109375, -5.7938232421875, -5.533935546875, -5.2740478515625, -5.01416015625, -4.7542724609375, -4.494384765625, -4.2344970703125, -3.974609375, -3.7147216796875, -3.454833984375, -3.1949462890625, -2.93505859375, -2.6751708984375, -2.415283203125, -2.1553955078125, -1.8955078125, -1.6356201171875, -1.375732421875, -1.1158447265625, -0.85595703125, -0.5960693359375, -0.336181640625, -0.0762939453125, 0.18359375, 0.4434814453125, 0.703369140625, 0.9632568359375, 1.22314453125, 1.4830322265625, 1.742919921875, 2.0028076171875, 2.2626953125, 2.5225830078125, 2.782470703125, 3.0423583984375, 3.30224609375, 3.5621337890625, 3.822021484375, 4.0819091796875, 4.341796875, 4.6016845703125, 4.861572265625, 5.1214599609375, 5.38134765625, 5.6412353515625, 5.901123046875, 6.1610107421875, 6.4208984375, 6.6807861328125, 6.940673828125, 7.2005615234375, 7.46044921875, 7.7203369140625, 7.980224609375, 8.2401123046875, 8.5]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 4.0, 4.0, 7.0, 10.0, 17.0, 19.0, 29.0, 55.0, 62.0, 107.0, 187.0, 259.0, 412.0, 575.0, 874.0, 1315.0, 2021.0, 3040.0, 4799.0, 7342.0, 11382.0, 18026.0, 28844.0, 45801.0, 71527.0, 106640.0, 146232.0, 168695.0, 142024.0, 102123.0, 67511.0, 43045.0, 27191.0, 17326.0, 11098.0, 7097.0, 4527.0, 2870.0, 1917.0, 1195.0, 787.0, 497.0, 348.0, 218.0, 142.0, 99.0, 86.0, 64.0, 28.0, 36.0, 15.0, 14.0, 4.0, 9.0, 2.0, 1.0, 2.0, 4.0], "bins": [-0.57861328125, -0.561309814453125, -0.54400634765625, -0.526702880859375, -0.5093994140625, -0.492095947265625, -0.47479248046875, -0.457489013671875, -0.440185546875, -0.422882080078125, -0.40557861328125, -0.388275146484375, -0.3709716796875, -0.353668212890625, -0.33636474609375, -0.319061279296875, -0.3017578125, -0.284454345703125, -0.26715087890625, -0.249847412109375, -0.2325439453125, -0.215240478515625, -0.19793701171875, -0.180633544921875, -0.163330078125, -0.146026611328125, -0.12872314453125, -0.111419677734375, -0.0941162109375, -0.076812744140625, -0.05950927734375, -0.042205810546875, -0.02490234375, -0.007598876953125, 0.00970458984375, 0.027008056640625, 0.0443115234375, 0.061614990234375, 0.07891845703125, 0.096221923828125, 0.113525390625, 0.130828857421875, 0.14813232421875, 0.165435791015625, 0.1827392578125, 0.200042724609375, 0.21734619140625, 0.234649658203125, 0.251953125, 0.269256591796875, 0.28656005859375, 0.303863525390625, 0.3211669921875, 0.338470458984375, 0.35577392578125, 0.373077392578125, 0.390380859375, 0.407684326171875, 0.42498779296875, 0.442291259765625, 0.4595947265625, 0.476898193359375, 0.49420166015625, 0.511505126953125, 0.52880859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 6.0, 6.0, 5.0, 10.0, 13.0, 13.0, 16.0, 25.0, 23.0, 30.0, 37.0, 24.0, 36.0, 37.0, 41.0, 35.0, 52.0, 34.0, 34.0, 1056.0, 39.0, 36.0, 36.0, 47.0, 41.0, 28.0, 37.0, 21.0, 26.0, 29.0, 19.0, 23.0, 14.0, 13.0, 16.0, 9.0, 13.0, 7.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.55859375, -5.384521484375, -5.21044921875, -5.036376953125, -4.8623046875, -4.688232421875, -4.51416015625, -4.340087890625, -4.166015625, -3.991943359375, -3.81787109375, -3.643798828125, -3.4697265625, -3.295654296875, -3.12158203125, -2.947509765625, -2.7734375, -2.599365234375, -2.42529296875, -2.251220703125, -2.0771484375, -1.903076171875, -1.72900390625, -1.554931640625, -1.380859375, -1.206787109375, -1.03271484375, -0.858642578125, -0.6845703125, -0.510498046875, -0.33642578125, -0.162353515625, 0.01171875, 0.185791015625, 0.35986328125, 0.533935546875, 0.7080078125, 0.882080078125, 1.05615234375, 1.230224609375, 1.404296875, 1.578369140625, 1.75244140625, 1.926513671875, 2.1005859375, 2.274658203125, 2.44873046875, 2.622802734375, 2.796875, 2.970947265625, 3.14501953125, 3.319091796875, 3.4931640625, 3.667236328125, 3.84130859375, 4.015380859375, 4.189453125, 4.363525390625, 4.53759765625, 4.711669921875, 4.8857421875, 5.059814453125, 5.23388671875, 5.407958984375, 5.58203125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 8.0, 14.0, 22.0, 30.0, 54.0, 76.0, 111.0, 155.0, 259.0, 401.0, 664.0, 1092.0, 1645.0, 2718.0, 4228.0, 6792.0, 10954.0, 17249.0, 26937.0, 42072.0, 64359.0, 93989.0, 127659.0, 1160977.0, 182580.0, 115752.0, 82616.0, 55603.0, 35934.0, 23127.0, 14539.0, 9109.0, 5673.0, 3580.0, 2270.0, 1440.0, 885.0, 589.0, 360.0, 219.0, 140.0, 96.0, 56.0, 34.0, 18.0, 14.0, 13.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.431396484375, -0.41783905029296875, -0.4042816162109375, -0.39072418212890625, -0.377166748046875, -0.36360931396484375, -0.3500518798828125, -0.33649444580078125, -0.32293701171875, -0.30937957763671875, -0.2958221435546875, -0.28226470947265625, -0.268707275390625, -0.25514984130859375, -0.2415924072265625, -0.22803497314453125, -0.2144775390625, -0.20092010498046875, -0.1873626708984375, -0.17380523681640625, -0.160247802734375, -0.14669036865234375, -0.1331329345703125, -0.11957550048828125, -0.10601806640625, -0.09246063232421875, -0.0789031982421875, -0.06534576416015625, -0.051788330078125, -0.03823089599609375, -0.0246734619140625, -0.01111602783203125, 0.00244140625, 0.01599884033203125, 0.0295562744140625, 0.04311370849609375, 0.056671142578125, 0.07022857666015625, 0.0837860107421875, 0.09734344482421875, 0.11090087890625, 0.12445831298828125, 0.1380157470703125, 0.15157318115234375, 0.165130615234375, 0.17868804931640625, 0.1922454833984375, 0.20580291748046875, 0.2193603515625, 0.23291778564453125, 0.2464752197265625, 0.26003265380859375, 0.273590087890625, 0.28714752197265625, 0.3007049560546875, 0.31426239013671875, 0.32781982421875, 0.34137725830078125, 0.3549346923828125, 0.36849212646484375, 0.382049560546875, 0.39560699462890625, 0.4091644287109375, 0.42272186279296875, 0.436279296875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 3.0, 8.0, 7.0, 13.0, 11.0, 16.0, 23.0, 26.0, 39.0, 48.0, 66.0, 87.0, 90.0, 96.0, 101.0, 63.0, 68.0, 47.0, 34.0, 36.0, 19.0, 27.0, 8.0, 10.0, 12.0, 7.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01265716552734375, -0.012302517890930176, -0.011947870254516602, -0.011593222618103027, -0.011238574981689453, -0.010883927345275879, -0.010529279708862305, -0.01017463207244873, -0.009819984436035156, -0.009465336799621582, -0.009110689163208008, -0.008756041526794434, -0.00840139389038086, -0.008046746253967285, -0.007692098617553711, -0.007337450981140137, -0.0069828033447265625, -0.006628155708312988, -0.006273508071899414, -0.00591886043548584, -0.005564212799072266, -0.005209565162658691, -0.004854917526245117, -0.004500269889831543, -0.004145622253417969, -0.0037909746170043945, -0.0034363269805908203, -0.003081679344177246, -0.002727031707763672, -0.0023723840713500977, -0.0020177364349365234, -0.0016630887985229492, -0.001308441162109375, -0.0009537935256958008, -0.0005991458892822266, -0.00024449825286865234, 0.00011014938354492188, 0.0004647970199584961, 0.0008194446563720703, 0.0011740922927856445, 0.0015287399291992188, 0.001883387565612793, 0.002238035202026367, 0.0025926828384399414, 0.0029473304748535156, 0.00330197811126709, 0.003656625747680664, 0.004011273384094238, 0.0043659210205078125, 0.004720568656921387, 0.005075216293334961, 0.005429863929748535, 0.005784511566162109, 0.006139159202575684, 0.006493806838989258, 0.006848454475402832, 0.007203102111816406, 0.0075577497482299805, 0.007912397384643555, 0.008267045021057129, 0.008621692657470703, 0.008976340293884277, 0.009330987930297852, 0.009685635566711426, 0.010040283203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 6.0, 7.0, 9.0, 18.0, 23.0, 25.0, 33.0, 42.0, 57.0, 79.0, 127.0, 159.0, 275.0, 455.0, 915.0, 29463.0, 1011736.0, 3261.0, 703.0, 390.0, 218.0, 161.0, 97.0, 77.0, 43.0, 50.0, 29.0, 24.0, 12.0, 10.0, 10.0, 7.0, 7.0, 1.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1566162109375, -0.15108489990234375, -0.1455535888671875, -0.14002227783203125, -0.134490966796875, -0.12895965576171875, -0.1234283447265625, -0.11789703369140625, -0.11236572265625, -0.10683441162109375, -0.1013031005859375, -0.09577178955078125, -0.090240478515625, -0.08470916748046875, -0.0791778564453125, -0.07364654541015625, -0.068115234375, -0.06258392333984375, -0.0570526123046875, -0.05152130126953125, -0.045989990234375, -0.04045867919921875, -0.0349273681640625, -0.02939605712890625, -0.02386474609375, -0.01833343505859375, -0.0128021240234375, -0.00727081298828125, -0.001739501953125, 0.00379180908203125, 0.0093231201171875, 0.01485443115234375, 0.0203857421875, 0.02591705322265625, 0.0314483642578125, 0.03697967529296875, 0.042510986328125, 0.04804229736328125, 0.0535736083984375, 0.05910491943359375, 0.06463623046875, 0.07016754150390625, 0.0756988525390625, 0.08123016357421875, 0.086761474609375, 0.09229278564453125, 0.0978240966796875, 0.10335540771484375, 0.10888671875, 0.11441802978515625, 0.1199493408203125, 0.12548065185546875, 0.131011962890625, 0.13654327392578125, 0.1420745849609375, 0.14760589599609375, 0.15313720703125, 0.15866851806640625, 0.1641998291015625, 0.16973114013671875, 0.175262451171875, 0.18079376220703125, 0.1863250732421875, 0.19185638427734375, 0.1973876953125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 94.0, 883.0, 35.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09171372652053833, -0.08999724686145782, -0.08828076720237732, -0.08656428009271622, -0.08484780043363571, -0.0831313207745552, -0.0814148336648941, -0.0796983540058136, -0.0779818743467331, -0.07626539468765259, -0.07454891502857208, -0.07283242791891098, -0.07111594825983047, -0.06939946860074997, -0.06768298149108887, -0.06596650183200836, -0.06425002217292786, -0.06253354251384735, -0.06081705912947655, -0.05910057574510574, -0.05738409608602524, -0.05566761642694473, -0.05395113304257393, -0.052234649658203125, -0.05051816999912262, -0.048801690340042114, -0.04708520695567131, -0.04536872357130051, -0.04365224391222, -0.041935764253139496, -0.04021928086876869, -0.03850279748439789, -0.03678631782531738, -0.03506983816623688, -0.033353354781866074, -0.03163687139749527, -0.029920391738414764, -0.02820391021668911, -0.026487428694963455, -0.0247709471732378, -0.023054463788866997, -0.021337982267141342, -0.019621500745415688, -0.017905019223690033, -0.01618853770196438, -0.014472056180238724, -0.01275557465851307, -0.011039093136787415, -0.00932261161506176, -0.007606130093336105, -0.005889648571610451, -0.004173167049884796, -0.0024566855281591415, -0.0007402040064334869, 0.0009762775152921677, 0.0026927590370178223, 0.004409240558743477, 0.0061257220804691315, 0.007842203602194786, 0.00955868512392044, 0.011275166645646095, 0.01299164816737175, 0.014708129689097404, 0.01642461121082306, 0.018141092732548714]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 11.0, 6.0, 13.0, 8.0, 6.0, 23.0, 18.0, 27.0, 28.0, 23.0, 43.0, 58.0, 37.0, 48.0, 58.0, 46.0, 52.0, 58.0, 52.0, 41.0, 65.0, 58.0, 50.0, 31.0, 26.0, 36.0, 25.0, 21.0, 11.0, 5.0, 5.0, 9.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005323052406311035, -0.005099687725305557, -0.004876323044300079, -0.0046529583632946014, -0.0044295936822891235, -0.004206229001283646, -0.003982864320278168, -0.00375949963927269, -0.003536134958267212, -0.003312770277261734, -0.003089405596256256, -0.002866040915250778, -0.0026426762342453003, -0.0024193115532398224, -0.0021959468722343445, -0.0019725821912288666, -0.0017492175102233887, -0.0015258528292179108, -0.0013024881482124329, -0.001079123467206955, -0.000855758786201477, -0.0006323941051959991, -0.00040902942419052124, -0.00018566474318504333, 3.769993782043457e-05, 0.0002610646188259125, 0.0004844292998313904, 0.0007077939808368683, 0.0009311586618423462, 0.001154523342847824, 0.001377888023853302, 0.00160125270485878, 0.0018246173858642578, 0.0020479820668697357, 0.0022713467478752136, 0.0024947114288806915, 0.0027180761098861694, 0.0029414407908916473, 0.0031648054718971252, 0.003388170152902603, 0.003611534833908081, 0.003834899514913559, 0.004058264195919037, 0.004281628876924515, 0.004504993557929993, 0.004728358238935471, 0.0049517229199409485, 0.005175087600946426, 0.005398452281951904, 0.005621816962957382, 0.00584518164396286, 0.006068546324968338, 0.006291911005973816, 0.006515275686979294, 0.006738640367984772, 0.00696200504899025, 0.0071853697299957275, 0.0074087344110012054, 0.007632099092006683, 0.007855463773012161, 0.00807882845401764, 0.008302193135023117, 0.008525557816028595, 0.008748922497034073, 0.00897228717803955]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 9.0, 19.0, 15.0, 19.0, 16.0, 23.0, 19.0, 26.0, 17.0, 35.0, 37.0, 36.0, 34.0, 47.0, 49.0, 48.0, 43.0, 50.0, 31.0, 35.0, 40.0, 31.0, 31.0, 29.0, 38.0, 30.0, 27.0, 13.0, 19.0, 17.0, 12.0, 15.0, 14.0, 7.0, 10.0, 3.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.1328125, -7.8729248046875, -7.613037109375, -7.3531494140625, -7.09326171875, -6.8333740234375, -6.573486328125, -6.3135986328125, -6.0537109375, -5.7938232421875, -5.533935546875, -5.2740478515625, -5.01416015625, -4.7542724609375, -4.494384765625, -4.2344970703125, -3.974609375, -3.7147216796875, -3.454833984375, -3.1949462890625, -2.93505859375, -2.6751708984375, -2.415283203125, -2.1553955078125, -1.8955078125, -1.6356201171875, -1.375732421875, -1.1158447265625, -0.85595703125, -0.5960693359375, -0.336181640625, -0.0762939453125, 0.18359375, 0.4434814453125, 0.703369140625, 0.9632568359375, 1.22314453125, 1.4830322265625, 1.742919921875, 2.0028076171875, 2.2626953125, 2.5225830078125, 2.782470703125, 3.0423583984375, 3.30224609375, 3.5621337890625, 3.822021484375, 4.0819091796875, 4.341796875, 4.6016845703125, 4.861572265625, 5.1214599609375, 5.38134765625, 5.6412353515625, 5.901123046875, 6.1610107421875, 6.4208984375, 6.6807861328125, 6.940673828125, 7.2005615234375, 7.46044921875, 7.7203369140625, 7.980224609375, 8.2401123046875, 8.5]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 9.0, 2.0, 9.0, 8.0, 7.0, 13.0, 16.0, 17.0, 20.0, 31.0, 39.0, 48.0, 73.0, 106.0, 140.0, 187.0, 204.0, 357.0, 483.0, 777.0, 1119.0, 1955.0, 4183.0, 11665.0, 42597.0, 226110.0, 588922.0, 125876.0, 27205.0, 8241.0, 3244.0, 1675.0, 932.0, 658.0, 448.0, 330.0, 211.0, 163.0, 104.0, 97.0, 61.0, 50.0, 42.0, 21.0, 34.0, 20.0, 10.0, 14.0, 8.0, 7.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-13.6796875, -13.2567138671875, -12.833740234375, -12.4107666015625, -11.98779296875, -11.5648193359375, -11.141845703125, -10.7188720703125, -10.2958984375, -9.8729248046875, -9.449951171875, -9.0269775390625, -8.60400390625, -8.1810302734375, -7.758056640625, -7.3350830078125, -6.912109375, -6.4891357421875, -6.066162109375, -5.6431884765625, -5.22021484375, -4.7972412109375, -4.374267578125, -3.9512939453125, -3.5283203125, -3.1053466796875, -2.682373046875, -2.2593994140625, -1.83642578125, -1.4134521484375, -0.990478515625, -0.5675048828125, -0.14453125, 0.2784423828125, 0.701416015625, 1.1243896484375, 1.54736328125, 1.9703369140625, 2.393310546875, 2.8162841796875, 3.2392578125, 3.6622314453125, 4.085205078125, 4.5081787109375, 4.93115234375, 5.3541259765625, 5.777099609375, 6.2000732421875, 6.623046875, 7.0460205078125, 7.468994140625, 7.8919677734375, 8.31494140625, 8.7379150390625, 9.160888671875, 9.5838623046875, 10.0068359375, 10.4298095703125, 10.852783203125, 11.2757568359375, 11.69873046875, 12.1217041015625, 12.544677734375, 12.9676513671875, 13.390625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 12.0, 13.0, 17.0, 13.0, 21.0, 29.0, 34.0, 31.0, 44.0, 55.0, 60.0, 104.0, 322.0, 1701.0, 178.0, 81.0, 45.0, 56.0, 40.0, 34.0, 38.0, 23.0, 15.0, 10.0, 10.0, 12.0, 6.0, 5.0, 3.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.859375, -27.991943359375, -27.12451171875, -26.257080078125, -25.3896484375, -24.522216796875, -23.65478515625, -22.787353515625, -21.919921875, -21.052490234375, -20.18505859375, -19.317626953125, -18.4501953125, -17.582763671875, -16.71533203125, -15.847900390625, -14.98046875, -14.113037109375, -13.24560546875, -12.378173828125, -11.5107421875, -10.643310546875, -9.77587890625, -8.908447265625, -8.041015625, -7.173583984375, -6.30615234375, -5.438720703125, -4.5712890625, -3.703857421875, -2.83642578125, -1.968994140625, -1.1015625, -0.234130859375, 0.63330078125, 1.500732421875, 2.3681640625, 3.235595703125, 4.10302734375, 4.970458984375, 5.837890625, 6.705322265625, 7.57275390625, 8.440185546875, 9.3076171875, 10.175048828125, 11.04248046875, 11.909912109375, 12.77734375, 13.644775390625, 14.51220703125, 15.379638671875, 16.2470703125, 17.114501953125, 17.98193359375, 18.849365234375, 19.716796875, 20.584228515625, 21.45166015625, 22.319091796875, 23.1865234375, 24.053955078125, 24.92138671875, 25.788818359375, 26.65625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 4.0, 12.0, 12.0, 9.0, 17.0, 21.0, 31.0, 57.0, 95.0, 129.0, 217.0, 482.0, 1201.0, 185061.0, 2955607.0, 1473.0, 540.0, 293.0, 158.0, 83.0, 57.0, 27.0, 26.0, 27.0, 12.0, 9.0, 12.0, 6.0, 4.0, 1.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.7490234375, -64.373046875, -61.9970703125, -59.62109375, -57.2451171875, -54.869140625, -52.4931640625, -50.1171875, -47.7412109375, -45.365234375, -42.9892578125, -40.61328125, -38.2373046875, -35.861328125, -33.4853515625, -31.109375, -28.7333984375, -26.357421875, -23.9814453125, -21.60546875, -19.2294921875, -16.853515625, -14.4775390625, -12.1015625, -9.7255859375, -7.349609375, -4.9736328125, -2.59765625, -0.2216796875, 2.154296875, 4.5302734375, 6.90625, 9.2822265625, 11.658203125, 14.0341796875, 16.41015625, 18.7861328125, 21.162109375, 23.5380859375, 25.9140625, 28.2900390625, 30.666015625, 33.0419921875, 35.41796875, 37.7939453125, 40.169921875, 42.5458984375, 44.921875, 47.2978515625, 49.673828125, 52.0498046875, 54.42578125, 56.8017578125, 59.177734375, 61.5537109375, 63.9296875, 66.3056640625, 68.681640625, 71.0576171875, 73.43359375, 75.8095703125, 78.185546875, 80.5615234375, 82.9375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 18.0, 31.0, 74.0, 142.0, 220.0, 212.0, 142.0, 90.0, 48.0, 18.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.91883850097656, -46.516788482666016, -45.114742279052734, -43.71269226074219, -42.310646057128906, -40.90859603881836, -39.50654602050781, -38.10449981689453, -36.70245361328125, -35.3004035949707, -33.89835739135742, -32.496307373046875, -31.094261169433594, -29.692211151123047, -28.290163040161133, -26.88811492919922, -25.486064910888672, -24.084016799926758, -22.681968688964844, -21.279918670654297, -19.877872467041016, -18.47582244873047, -17.073774337768555, -15.67172622680664, -14.269678115844727, -12.867630004882812, -11.465581893920898, -10.063532829284668, -8.661484718322754, -7.25943660736084, -5.857387542724609, -4.455339431762695, -3.053295135498047, -1.6512467861175537, -0.24919843673706055, 1.1528501510620117, 2.554898262023926, 3.95694637298584, 5.35899543762207, 6.761043548583984, 8.163091659545898, 9.565139770507812, 10.967187881469727, 12.369236946105957, 13.771285057067871, 15.173333168029785, 16.575382232666016, 17.97743034362793, 19.379478454589844, 20.781526565551758, 22.183574676513672, 23.58562469482422, 24.9876708984375, 26.389720916748047, 27.79176902770996, 29.193817138671875, 30.59586524963379, 31.997913360595703, 33.39996337890625, 34.80200958251953, 36.20405960083008, 37.60610580444336, 39.008155822753906, 40.41020202636719, 41.812252044677734]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 3.0, 6.0, 9.0, 4.0, 7.0, 17.0, 11.0, 18.0, 20.0, 14.0, 30.0, 33.0, 23.0, 33.0, 32.0, 39.0, 39.0, 40.0, 52.0, 37.0, 44.0, 49.0, 48.0, 34.0, 33.0, 38.0, 41.0, 30.0, 28.0, 33.0, 21.0, 26.0, 20.0, 12.0, 20.0, 14.0, 11.0, 3.0, 5.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-53.2913818359375, -51.778995513916016, -50.26660919189453, -48.75422286987305, -47.24183654785156, -45.72945022583008, -44.217063903808594, -42.704681396484375, -41.192291259765625, -39.67990493774414, -38.167518615722656, -36.65513229370117, -35.14274597167969, -33.6303596496582, -32.11797332763672, -30.605588912963867, -29.093204498291016, -27.58081817626953, -26.068431854248047, -24.556045532226562, -23.043659210205078, -21.531272888183594, -20.018888473510742, -18.506502151489258, -16.994115829467773, -15.481729507446289, -13.969343185424805, -12.456957817077637, -10.944571495056152, -9.432185173034668, -7.9197998046875, -6.407413482666016, -4.895027160644531, -3.382641077041626, -1.8702549934387207, -0.35786914825439453, 1.1545171737670898, 2.666903495788574, 4.179288864135742, 5.691675186157227, 7.204061508178711, 8.716447830200195, 10.22883415222168, 11.741219520568848, 13.253605842590332, 14.765992164611816, 16.278377532958984, 17.79076385498047, 19.303150177001953, 20.815536499023438, 22.327922821044922, 23.840309143066406, 25.35269546508789, 26.865081787109375, 28.377466201782227, 29.88985252380371, 31.402238845825195, 32.91462326049805, 34.42700958251953, 35.939395904541016, 37.4517822265625, 38.964168548583984, 40.47655487060547, 41.98894119262695, 43.50132751464844]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 10.0, 7.0, 8.0, 7.0, 9.0, 14.0, 15.0, 21.0, 17.0, 23.0, 21.0, 25.0, 21.0, 29.0, 23.0, 28.0, 29.0, 40.0, 43.0, 40.0, 39.0, 54.0, 40.0, 29.0, 39.0, 36.0, 31.0, 35.0, 30.0, 29.0, 31.0, 19.0, 28.0, 21.0, 17.0, 6.0, 8.0, 15.0, 11.0, 6.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.78125, -8.50732421875, -8.2333984375, -7.95947265625, -7.685546875, -7.41162109375, -7.1376953125, -6.86376953125, -6.58984375, -6.31591796875, -6.0419921875, -5.76806640625, -5.494140625, -5.22021484375, -4.9462890625, -4.67236328125, -4.3984375, -4.12451171875, -3.8505859375, -3.57666015625, -3.302734375, -3.02880859375, -2.7548828125, -2.48095703125, -2.20703125, -1.93310546875, -1.6591796875, -1.38525390625, -1.111328125, -0.83740234375, -0.5634765625, -0.28955078125, -0.015625, 0.25830078125, 0.5322265625, 0.80615234375, 1.080078125, 1.35400390625, 1.6279296875, 1.90185546875, 2.17578125, 2.44970703125, 2.7236328125, 2.99755859375, 3.271484375, 3.54541015625, 3.8193359375, 4.09326171875, 4.3671875, 4.64111328125, 4.9150390625, 5.18896484375, 5.462890625, 5.73681640625, 6.0107421875, 6.28466796875, 6.55859375, 6.83251953125, 7.1064453125, 7.38037109375, 7.654296875, 7.92822265625, 8.2021484375, 8.47607421875, 8.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 5.0, 2.0, 10.0, 7.0, 12.0, 17.0, 23.0, 33.0, 39.0, 66.0, 78.0, 118.0, 144.0, 189.0, 289.0, 374.0, 555.0, 933.0, 2130.0, 14457.0, 1092811.0, 3034865.0, 40524.0, 3216.0, 1170.0, 663.0, 456.0, 278.0, 217.0, 166.0, 133.0, 82.0, 63.0, 41.0, 26.0, 19.0, 27.0, 13.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -53.99072265625, -52.2001953125, -50.40966796875, -48.619140625, -46.82861328125, -45.0380859375, -43.24755859375, -41.45703125, -39.66650390625, -37.8759765625, -36.08544921875, -34.294921875, -32.50439453125, -30.7138671875, -28.92333984375, -27.1328125, -25.34228515625, -23.5517578125, -21.76123046875, -19.970703125, -18.18017578125, -16.3896484375, -14.59912109375, -12.80859375, -11.01806640625, -9.2275390625, -7.43701171875, -5.646484375, -3.85595703125, -2.0654296875, -0.27490234375, 1.515625, 3.30615234375, 5.0966796875, 6.88720703125, 8.677734375, 10.46826171875, 12.2587890625, 14.04931640625, 15.83984375, 17.63037109375, 19.4208984375, 21.21142578125, 23.001953125, 24.79248046875, 26.5830078125, 28.37353515625, 30.1640625, 31.95458984375, 33.7451171875, 35.53564453125, 37.326171875, 39.11669921875, 40.9072265625, 42.69775390625, 44.48828125, 46.27880859375, 48.0693359375, 49.85986328125, 51.650390625, 53.44091796875, 55.2314453125, 57.02197265625, 58.8125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 11.0, 22.0, 28.0, 31.0, 61.0, 84.0, 130.0, 202.0, 334.0, 542.0, 673.0, 620.0, 439.0, 304.0, 205.0, 135.0, 91.0, 46.0, 39.0, 17.0, 18.0, 11.0, 13.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.265625, -28.5667724609375, -27.867919921875, -27.1690673828125, -26.47021484375, -25.7713623046875, -25.072509765625, -24.3736572265625, -23.6748046875, -22.9759521484375, -22.277099609375, -21.5782470703125, -20.87939453125, -20.1805419921875, -19.481689453125, -18.7828369140625, -18.083984375, -17.3851318359375, -16.686279296875, -15.9874267578125, -15.28857421875, -14.5897216796875, -13.890869140625, -13.1920166015625, -12.4931640625, -11.7943115234375, -11.095458984375, -10.3966064453125, -9.69775390625, -8.9989013671875, -8.300048828125, -7.6011962890625, -6.90234375, -6.2034912109375, -5.504638671875, -4.8057861328125, -4.10693359375, -3.4080810546875, -2.709228515625, -2.0103759765625, -1.3115234375, -0.6126708984375, 0.086181640625, 0.7850341796875, 1.48388671875, 2.1827392578125, 2.881591796875, 3.5804443359375, 4.279296875, 4.9781494140625, 5.677001953125, 6.3758544921875, 7.07470703125, 7.7735595703125, 8.472412109375, 9.1712646484375, 9.8701171875, 10.5689697265625, 11.267822265625, 11.9666748046875, 12.66552734375, 13.3643798828125, 14.063232421875, 14.7620849609375, 15.4609375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 9.0, 10.0, 9.0, 32.0, 26.0, 56.0, 40.0, 84.0, 125.0, 229.0, 377.0, 843.0, 1739.0, 4419.0, 13050.0, 50213.0, 269913.0, 2048250.0, 1545099.0, 202154.0, 39776.0, 11033.0, 3628.0, 1548.0, 706.0, 334.0, 171.0, 120.0, 74.0, 49.0, 29.0, 29.0, 21.0, 20.0, 12.0, 8.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.4501953125, -15.900390625, -15.3505859375, -14.80078125, -14.2509765625, -13.701171875, -13.1513671875, -12.6015625, -12.0517578125, -11.501953125, -10.9521484375, -10.40234375, -9.8525390625, -9.302734375, -8.7529296875, -8.203125, -7.6533203125, -7.103515625, -6.5537109375, -6.00390625, -5.4541015625, -4.904296875, -4.3544921875, -3.8046875, -3.2548828125, -2.705078125, -2.1552734375, -1.60546875, -1.0556640625, -0.505859375, 0.0439453125, 0.59375, 1.1435546875, 1.693359375, 2.2431640625, 2.79296875, 3.3427734375, 3.892578125, 4.4423828125, 4.9921875, 5.5419921875, 6.091796875, 6.6416015625, 7.19140625, 7.7412109375, 8.291015625, 8.8408203125, 9.390625, 9.9404296875, 10.490234375, 11.0400390625, 11.58984375, 12.1396484375, 12.689453125, 13.2392578125, 13.7890625, 14.3388671875, 14.888671875, 15.4384765625, 15.98828125, 16.5380859375, 17.087890625, 17.6376953125, 18.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 18.0, 12.0, 19.0, 18.0, 25.0, 34.0, 34.0, 34.0, 56.0, 56.0, 63.0, 56.0, 54.0, 65.0, 55.0, 56.0, 38.0, 46.0, 43.0, 37.0, 31.0, 25.0, 16.0, 26.0, 8.0, 14.0, 7.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.71598815917969, -63.41459655761719, -61.11320495605469, -58.81181335449219, -56.51042175292969, -54.20903015136719, -51.90763473510742, -49.60624313354492, -47.30485153198242, -45.00345993041992, -42.70206832885742, -40.40067672729492, -38.099281311035156, -35.797889709472656, -33.496498107910156, -31.195106506347656, -28.893714904785156, -26.592323303222656, -24.290931701660156, -21.989538192749023, -19.688146591186523, -17.386754989624023, -15.085362434387207, -12.78396987915039, -10.48257827758789, -8.18118667602539, -5.879794120788574, -3.578402042388916, -1.2770099639892578, 1.0243816375732422, 3.3257741928100586, 5.627166748046875, 7.928565979003906, 10.229957580566406, 12.531350135803223, 14.832742691040039, 17.13413429260254, 19.43552589416504, 21.736919403076172, 24.038311004638672, 26.339702606201172, 28.641094207763672, 30.942485809326172, 33.24387741088867, 35.54527282714844, 37.84666442871094, 40.14805603027344, 42.44944763183594, 44.75083923339844, 47.05223083496094, 49.35362243652344, 51.65501403808594, 53.95640563964844, 56.25779724121094, 58.5591926574707, 60.8605842590332, 63.1619758605957, 65.46337127685547, 67.76476287841797, 70.06615447998047, 72.36754608154297, 74.66893768310547, 76.97032928466797, 79.27172088623047, 81.57311248779297]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 4.0, 4.0, 11.0, 17.0, 6.0, 10.0, 11.0, 23.0, 16.0, 25.0, 35.0, 39.0, 21.0, 31.0, 50.0, 30.0, 39.0, 43.0, 34.0, 59.0, 49.0, 39.0, 41.0, 37.0, 43.0, 30.0, 35.0, 34.0, 23.0, 26.0, 18.0, 19.0, 30.0, 14.0, 9.0, 10.0, 8.0, 5.0, 8.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.457855224609375, -53.38108825683594, -51.3043212890625, -49.22755432128906, -47.15079116821289, -45.07402420043945, -42.997257232666016, -40.92049026489258, -38.843727111816406, -36.76696014404297, -34.69019317626953, -32.613426208496094, -30.536663055419922, -28.459896087646484, -26.383129119873047, -24.30636215209961, -22.229595184326172, -20.152828216552734, -18.07606315612793, -15.999296188354492, -13.922530174255371, -11.84576416015625, -9.768997192382812, -7.692231178283691, -5.61546516418457, -3.53869891166687, -1.46193265914917, 0.6148338317871094, 2.6915998458862305, 4.768365859985352, 6.845132827758789, 8.92189884185791, 10.998664855957031, 13.075430870056152, 15.152196884155273, 17.22896385192871, 19.305728912353516, 21.382495880126953, 23.45926284790039, 25.536029815673828, 27.612794876098633, 29.68956184387207, 31.766326904296875, 33.84309387207031, 35.91986083984375, 37.99662780761719, 40.073394775390625, 42.1501579284668, 44.226924896240234, 46.30369186401367, 48.38045883178711, 50.45722198486328, 52.53398895263672, 54.610755920410156, 56.687522888183594, 58.76428985595703, 60.84105682373047, 62.917823791503906, 64.99459075927734, 67.07135772705078, 69.14812469482422, 71.22488403320312, 73.30165100097656, 75.37841796875, 77.45518493652344]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 10.0, 8.0, 9.0, 12.0, 16.0, 16.0, 25.0, 25.0, 29.0, 39.0, 41.0, 31.0, 36.0, 48.0, 45.0, 40.0, 41.0, 61.0, 44.0, 46.0, 50.0, 48.0, 30.0, 43.0, 39.0, 22.0, 19.0, 24.0, 25.0, 18.0, 14.0, 8.0, 7.0, 5.0, 2.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.25, -101.341796875, -97.43359375, -93.525390625, -89.6171875, -85.708984375, -81.80078125, -77.892578125, -73.984375, -70.076171875, -66.16796875, -62.259765625, -58.3515625, -54.443359375, -50.53515625, -46.626953125, -42.71875, -38.810546875, -34.90234375, -30.994140625, -27.0859375, -23.177734375, -19.26953125, -15.361328125, -11.453125, -7.544921875, -3.63671875, 0.271484375, 4.1796875, 8.087890625, 11.99609375, 15.904296875, 19.8125, 23.720703125, 27.62890625, 31.537109375, 35.4453125, 39.353515625, 43.26171875, 47.169921875, 51.078125, 54.986328125, 58.89453125, 62.802734375, 66.7109375, 70.619140625, 74.52734375, 78.435546875, 82.34375, 86.251953125, 90.16015625, 94.068359375, 97.9765625, 101.884765625, 105.79296875, 109.701171875, 113.609375, 117.517578125, 121.42578125, 125.333984375, 129.2421875, 133.150390625, 137.05859375, 140.966796875, 144.875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 10.0, 7.0, 8.0, 11.0, 22.0, 40.0, 45.0, 62.0, 93.0, 135.0, 207.0, 331.0, 447.0, 705.0, 1167.0, 1666.0, 2651.0, 4014.0, 6151.0, 9403.0, 14552.0, 22584.0, 34995.0, 54011.0, 80974.0, 114739.0, 148466.0, 155678.0, 126948.0, 91477.0, 62187.0, 40349.0, 26237.0, 16736.0, 10914.0, 7128.0, 4640.0, 2957.0, 1907.0, 1325.0, 882.0, 605.0, 324.0, 266.0, 168.0, 95.0, 92.0, 53.0, 33.0, 22.0, 14.0, 12.0, 8.0, 7.0, 4.0, 4.0, 0.0, 0.0, 3.0], "bins": [-6.36328125, -6.16546630859375, -5.9676513671875, -5.76983642578125, -5.572021484375, -5.37420654296875, -5.1763916015625, -4.97857666015625, -4.78076171875, -4.58294677734375, -4.3851318359375, -4.18731689453125, -3.989501953125, -3.79168701171875, -3.5938720703125, -3.39605712890625, -3.1982421875, -3.00042724609375, -2.8026123046875, -2.60479736328125, -2.406982421875, -2.20916748046875, -2.0113525390625, -1.81353759765625, -1.61572265625, -1.41790771484375, -1.2200927734375, -1.02227783203125, -0.824462890625, -0.62664794921875, -0.4288330078125, -0.23101806640625, -0.033203125, 0.16461181640625, 0.3624267578125, 0.56024169921875, 0.758056640625, 0.95587158203125, 1.1536865234375, 1.35150146484375, 1.54931640625, 1.74713134765625, 1.9449462890625, 2.14276123046875, 2.340576171875, 2.53839111328125, 2.7362060546875, 2.93402099609375, 3.1318359375, 3.32965087890625, 3.5274658203125, 3.72528076171875, 3.923095703125, 4.12091064453125, 4.3187255859375, 4.51654052734375, 4.71435546875, 4.91217041015625, 5.1099853515625, 5.30780029296875, 5.505615234375, 5.70343017578125, 5.9012451171875, 6.09906005859375, 6.296875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 12.0, 9.0, 9.0, 7.0, 10.0, 12.0, 14.0, 24.0, 21.0, 20.0, 26.0, 22.0, 25.0, 31.0, 35.0, 38.0, 39.0, 26.0, 34.0, 30.0, 29.0, 1061.0, 41.0, 44.0, 34.0, 25.0, 35.0, 39.0, 22.0, 38.0, 27.0, 24.0, 23.0, 23.0, 10.0, 9.0, 19.0, 11.0, 8.0, 11.0, 6.0, 6.0, 8.0, 5.0, 6.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.03125, -57.1435546875, -55.255859375, -53.3681640625, -51.48046875, -49.5927734375, -47.705078125, -45.8173828125, -43.9296875, -42.0419921875, -40.154296875, -38.2666015625, -36.37890625, -34.4912109375, -32.603515625, -30.7158203125, -28.828125, -26.9404296875, -25.052734375, -23.1650390625, -21.27734375, -19.3896484375, -17.501953125, -15.6142578125, -13.7265625, -11.8388671875, -9.951171875, -8.0634765625, -6.17578125, -4.2880859375, -2.400390625, -0.5126953125, 1.375, 3.2626953125, 5.150390625, 7.0380859375, 8.92578125, 10.8134765625, 12.701171875, 14.5888671875, 16.4765625, 18.3642578125, 20.251953125, 22.1396484375, 24.02734375, 25.9150390625, 27.802734375, 29.6904296875, 31.578125, 33.4658203125, 35.353515625, 37.2412109375, 39.12890625, 41.0166015625, 42.904296875, 44.7919921875, 46.6796875, 48.5673828125, 50.455078125, 52.3427734375, 54.23046875, 56.1181640625, 58.005859375, 59.8935546875, 61.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 10.0, 16.0, 18.0, 28.0, 52.0, 82.0, 99.0, 195.0, 259.0, 375.0, 627.0, 965.0, 1642.0, 2425.0, 3828.0, 6160.0, 9830.0, 15452.0, 24417.0, 37814.0, 56982.0, 84487.0, 117598.0, 285885.0, 1056751.0, 123947.0, 91366.0, 62040.0, 41091.0, 26742.0, 16749.0, 10733.0, 6769.0, 4201.0, 2674.0, 1745.0, 1056.0, 715.0, 458.0, 298.0, 210.0, 111.0, 69.0, 50.0, 38.0, 29.0, 12.0, 10.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.6484375, -5.477783203125, -5.30712890625, -5.136474609375, -4.9658203125, -4.795166015625, -4.62451171875, -4.453857421875, -4.283203125, -4.112548828125, -3.94189453125, -3.771240234375, -3.6005859375, -3.429931640625, -3.25927734375, -3.088623046875, -2.91796875, -2.747314453125, -2.57666015625, -2.406005859375, -2.2353515625, -2.064697265625, -1.89404296875, -1.723388671875, -1.552734375, -1.382080078125, -1.21142578125, -1.040771484375, -0.8701171875, -0.699462890625, -0.52880859375, -0.358154296875, -0.1875, -0.016845703125, 0.15380859375, 0.324462890625, 0.4951171875, 0.665771484375, 0.83642578125, 1.007080078125, 1.177734375, 1.348388671875, 1.51904296875, 1.689697265625, 1.8603515625, 2.031005859375, 2.20166015625, 2.372314453125, 2.54296875, 2.713623046875, 2.88427734375, 3.054931640625, 3.2255859375, 3.396240234375, 3.56689453125, 3.737548828125, 3.908203125, 4.078857421875, 4.24951171875, 4.420166015625, 4.5908203125, 4.761474609375, 4.93212890625, 5.102783203125, 5.2734375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 9.0, 5.0, 14.0, 11.0, 16.0, 19.0, 23.0, 37.0, 30.0, 50.0, 52.0, 91.0, 85.0, 93.0, 84.0, 70.0, 55.0, 50.0, 38.0, 33.0, 22.0, 18.0, 16.0, 16.0, 16.0, 10.0, 12.0, 2.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1236572265625, -0.11906051635742188, -0.11446380615234375, -0.10986709594726562, -0.1052703857421875, -0.10067367553710938, -0.09607696533203125, -0.09148025512695312, -0.086883544921875, -0.08228683471679688, -0.07769012451171875, -0.07309341430664062, -0.0684967041015625, -0.06389999389648438, -0.05930328369140625, -0.054706573486328125, -0.05010986328125, -0.045513153076171875, -0.04091644287109375, -0.036319732666015625, -0.0317230224609375, -0.027126312255859375, -0.02252960205078125, -0.017932891845703125, -0.013336181640625, -0.008739471435546875, -0.00414276123046875, 0.000453948974609375, 0.0050506591796875, 0.009647369384765625, 0.01424407958984375, 0.018840789794921875, 0.0234375, 0.028034210205078125, 0.03263092041015625, 0.037227630615234375, 0.0418243408203125, 0.046421051025390625, 0.05101776123046875, 0.055614471435546875, 0.060211181640625, 0.06480789184570312, 0.06940460205078125, 0.07400131225585938, 0.0785980224609375, 0.08319473266601562, 0.08779144287109375, 0.09238815307617188, 0.09698486328125, 0.10158157348632812, 0.10617828369140625, 0.11077499389648438, 0.1153717041015625, 0.11996841430664062, 0.12456512451171875, 0.12916183471679688, 0.133758544921875, 0.13835525512695312, 0.14295196533203125, 0.14754867553710938, 0.1521453857421875, 0.15674209594726562, 0.16133880615234375, 0.16593551635742188, 0.1705322265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 10.0, 5.0, 8.0, 24.0, 27.0, 45.0, 59.0, 81.0, 119.0, 212.0, 329.0, 551.0, 1055.0, 2157.0, 4567.0, 10691.0, 28856.0, 98780.0, 475260.0, 319603.0, 68197.0, 21872.0, 8474.0, 3700.0, 1737.0, 920.0, 505.0, 255.0, 156.0, 106.0, 73.0, 44.0, 26.0, 15.0, 8.0, 9.0, 8.0, 5.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0], "bins": [-1.0107421875, -0.9840469360351562, -0.9573516845703125, -0.9306564331054688, -0.903961181640625, -0.8772659301757812, -0.8505706787109375, -0.8238754272460938, -0.79718017578125, -0.7704849243164062, -0.7437896728515625, -0.7170944213867188, -0.690399169921875, -0.6637039184570312, -0.6370086669921875, -0.6103134155273438, -0.5836181640625, -0.5569229125976562, -0.5302276611328125, -0.5035324096679688, -0.476837158203125, -0.45014190673828125, -0.4234466552734375, -0.39675140380859375, -0.37005615234375, -0.34336090087890625, -0.3166656494140625, -0.28997039794921875, -0.263275146484375, -0.23657989501953125, -0.2098846435546875, -0.18318939208984375, -0.156494140625, -0.12979888916015625, -0.1031036376953125, -0.07640838623046875, -0.049713134765625, -0.02301788330078125, 0.0036773681640625, 0.03037261962890625, 0.05706787109375, 0.08376312255859375, 0.1104583740234375, 0.13715362548828125, 0.163848876953125, 0.19054412841796875, 0.2172393798828125, 0.24393463134765625, 0.2706298828125, 0.29732513427734375, 0.3240203857421875, 0.35071563720703125, 0.377410888671875, 0.40410614013671875, 0.4308013916015625, 0.45749664306640625, 0.48419189453125, 0.5108871459960938, 0.5375823974609375, 0.5642776489257812, 0.590972900390625, 0.6176681518554688, 0.6443634033203125, 0.6710586547851562, 0.69775390625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 0.0, 6.0, 9.0, 14.0, 26.0, 40.0, 61.0, 75.0, 123.0, 144.0, 151.0, 121.0, 98.0, 50.0, 38.0, 21.0, 12.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25400230288505554, -0.24652716517448425, -0.23905202746391296, -0.23157688975334167, -0.22410175204277039, -0.2166266143321991, -0.2091514617204666, -0.20167632400989532, -0.19420118629932404, -0.18672604858875275, -0.17925091087818146, -0.17177577316761017, -0.16430062055587769, -0.1568254828453064, -0.1493503451347351, -0.14187520742416382, -0.13440006971359253, -0.12692493200302124, -0.11944979429244995, -0.11197464913129807, -0.10449951142072678, -0.09702437371015549, -0.0895492285490036, -0.08207409083843231, -0.07459895312786102, -0.06712381541728973, -0.059648673981428146, -0.05217353254556656, -0.04469839483499527, -0.03722325712442398, -0.029748115688562393, -0.022272974252700806, -0.01479785144329071, -0.007322711870074272, 0.00015242770314216614, 0.007627567276358604, 0.015102706849575043, 0.022577844560146332, 0.03005298599600792, 0.03752812743186951, 0.045003265142440796, 0.052478402853012085, 0.05995354428887367, 0.06742868572473526, 0.07490382343530655, 0.08237896114587784, 0.08985410630702972, 0.09732924401760101, 0.1048043817281723, 0.11227951943874359, 0.11975465714931488, 0.12722979485988617, 0.13470494747161865, 0.14218008518218994, 0.14965522289276123, 0.15713036060333252, 0.1646054983139038, 0.1720806360244751, 0.1795557737350464, 0.18703091144561768, 0.19450604915618896, 0.20198118686676025, 0.20945633947849274, 0.21693147718906403, 0.22440661489963531]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 4.0, 7.0, 5.0, 7.0, 12.0, 8.0, 14.0, 25.0, 18.0, 31.0, 22.0, 27.0, 26.0, 42.0, 34.0, 39.0, 37.0, 27.0, 40.0, 40.0, 39.0, 39.0, 29.0, 37.0, 44.0, 40.0, 38.0, 33.0, 34.0, 26.0, 13.0, 15.0, 24.0, 22.0, 17.0, 12.0, 14.0, 10.0, 9.0, 7.0, 2.0, 6.0, 2.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06296664476394653, -0.06081600859761238, -0.05866537243127823, -0.056514739990234375, -0.05436410382390022, -0.05221346765756607, -0.05006283521652222, -0.047912199050188065, -0.04576156288385391, -0.04361092671751976, -0.04146029055118561, -0.039309658110141754, -0.0371590219438076, -0.03500838577747345, -0.032857753336429596, -0.030707117170095444, -0.02855648100376129, -0.02640584483742714, -0.024255210533738136, -0.022104576230049133, -0.01995394006371498, -0.01780330389738083, -0.015652669593691826, -0.013502034358680248, -0.01135139912366867, -0.009200763888657093, -0.0070501286536455154, -0.004899493418633938, -0.0027488581836223602, -0.0005982229486107826, 0.001552412286400795, 0.0037030475214123726, 0.00585368275642395, 0.008004317991435528, 0.010154953226447105, 0.012305588461458683, 0.01445622369647026, 0.016606859862804413, 0.018757494166493416, 0.02090812847018242, 0.02305876463651657, 0.025209400802850723, 0.027360035106539726, 0.02951066941022873, 0.03166130557656288, 0.033811941742897034, 0.03596257418394089, 0.03811321035027504, 0.04026384651660919, 0.042414482682943344, 0.044565118849277496, 0.04671575129032135, 0.0488663874566555, 0.051017023622989655, 0.05316765606403351, 0.05531829223036766, 0.05746892839670181, 0.059619564563035965, 0.06177020072937012, 0.06392083317041397, 0.06607146561145782, 0.06822210550308228, 0.07037273794412613, 0.07252337783575058, 0.07467401027679443]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 10.0, 8.0, 9.0, 12.0, 15.0, 16.0, 26.0, 24.0, 30.0, 39.0, 40.0, 32.0, 36.0, 44.0, 49.0, 40.0, 39.0, 60.0, 45.0, 48.0, 51.0, 46.0, 29.0, 46.0, 37.0, 22.0, 20.0, 24.0, 24.0, 19.0, 14.0, 9.0, 6.0, 5.0, 2.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.4375, -101.5244140625, -97.611328125, -93.6982421875, -89.78515625, -85.8720703125, -81.958984375, -78.0458984375, -74.1328125, -70.2197265625, -66.306640625, -62.3935546875, -58.48046875, -54.5673828125, -50.654296875, -46.7412109375, -42.828125, -38.9150390625, -35.001953125, -31.0888671875, -27.17578125, -23.2626953125, -19.349609375, -15.4365234375, -11.5234375, -7.6103515625, -3.697265625, 0.2158203125, 4.12890625, 8.0419921875, 11.955078125, 15.8681640625, 19.78125, 23.6943359375, 27.607421875, 31.5205078125, 35.43359375, 39.3466796875, 43.259765625, 47.1728515625, 51.0859375, 54.9990234375, 58.912109375, 62.8251953125, 66.73828125, 70.6513671875, 74.564453125, 78.4775390625, 82.390625, 86.3037109375, 90.216796875, 94.1298828125, 98.04296875, 101.9560546875, 105.869140625, 109.7822265625, 113.6953125, 117.6083984375, 121.521484375, 125.4345703125, 129.34765625, 133.2607421875, 137.173828125, 141.0869140625, 145.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 5.0, 9.0, 17.0, 13.0, 19.0, 31.0, 46.0, 67.0, 109.0, 123.0, 218.0, 321.0, 512.0, 913.0, 1771.0, 3699.0, 8973.0, 28409.0, 126839.0, 501044.0, 288566.0, 59813.0, 15473.0, 5734.0, 2580.0, 1325.0, 740.0, 416.0, 251.0, 169.0, 106.0, 72.0, 50.0, 35.0, 28.0, 14.0, 10.0, 9.0, 9.0, 5.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.40625, -19.671142578125, -18.93603515625, -18.200927734375, -17.4658203125, -16.730712890625, -15.99560546875, -15.260498046875, -14.525390625, -13.790283203125, -13.05517578125, -12.320068359375, -11.5849609375, -10.849853515625, -10.11474609375, -9.379638671875, -8.64453125, -7.909423828125, -7.17431640625, -6.439208984375, -5.7041015625, -4.968994140625, -4.23388671875, -3.498779296875, -2.763671875, -2.028564453125, -1.29345703125, -0.558349609375, 0.1767578125, 0.911865234375, 1.64697265625, 2.382080078125, 3.1171875, 3.852294921875, 4.58740234375, 5.322509765625, 6.0576171875, 6.792724609375, 7.52783203125, 8.262939453125, 8.998046875, 9.733154296875, 10.46826171875, 11.203369140625, 11.9384765625, 12.673583984375, 13.40869140625, 14.143798828125, 14.87890625, 15.614013671875, 16.34912109375, 17.084228515625, 17.8193359375, 18.554443359375, 19.28955078125, 20.024658203125, 20.759765625, 21.494873046875, 22.22998046875, 22.965087890625, 23.7001953125, 24.435302734375, 25.17041015625, 25.905517578125, 26.640625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 14.0, 22.0, 19.0, 32.0, 31.0, 41.0, 46.0, 70.0, 55.0, 78.0, 2076.0, 116.0, 68.0, 70.0, 66.0, 49.0, 47.0, 26.0, 28.0, 14.0, 8.0, 5.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-259.75, -251.84375, -243.9375, -236.03125, -228.125, -220.21875, -212.3125, -204.40625, -196.5, -188.59375, -180.6875, -172.78125, -164.875, -156.96875, -149.0625, -141.15625, -133.25, -125.34375, -117.4375, -109.53125, -101.625, -93.71875, -85.8125, -77.90625, -70.0, -62.09375, -54.1875, -46.28125, -38.375, -30.46875, -22.5625, -14.65625, -6.75, 1.15625, 9.0625, 16.96875, 24.875, 32.78125, 40.6875, 48.59375, 56.5, 64.40625, 72.3125, 80.21875, 88.125, 96.03125, 103.9375, 111.84375, 119.75, 127.65625, 135.5625, 143.46875, 151.375, 159.28125, 167.1875, 175.09375, 183.0, 190.90625, 198.8125, 206.71875, 214.625, 222.53125, 230.4375, 238.34375, 246.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 3.0, 8.0, 13.0, 16.0, 12.0, 16.0, 20.0, 31.0, 40.0, 69.0, 80.0, 110.0, 163.0, 346.0, 577.0, 1211.0, 3801.0, 22786.0, 2628299.0, 463884.0, 18429.0, 3215.0, 1079.0, 542.0, 292.0, 190.0, 142.0, 88.0, 59.0, 41.0, 33.0, 24.0, 16.0, 16.0, 16.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-53.46875, -51.84619140625, -50.2236328125, -48.60107421875, -46.978515625, -45.35595703125, -43.7333984375, -42.11083984375, -40.48828125, -38.86572265625, -37.2431640625, -35.62060546875, -33.998046875, -32.37548828125, -30.7529296875, -29.13037109375, -27.5078125, -25.88525390625, -24.2626953125, -22.64013671875, -21.017578125, -19.39501953125, -17.7724609375, -16.14990234375, -14.52734375, -12.90478515625, -11.2822265625, -9.65966796875, -8.037109375, -6.41455078125, -4.7919921875, -3.16943359375, -1.546875, 0.07568359375, 1.6982421875, 3.32080078125, 4.943359375, 6.56591796875, 8.1884765625, 9.81103515625, 11.43359375, 13.05615234375, 14.6787109375, 16.30126953125, 17.923828125, 19.54638671875, 21.1689453125, 22.79150390625, 24.4140625, 26.03662109375, 27.6591796875, 29.28173828125, 30.904296875, 32.52685546875, 34.1494140625, 35.77197265625, 37.39453125, 39.01708984375, 40.6396484375, 42.26220703125, 43.884765625, 45.50732421875, 47.1298828125, 48.75244140625, 50.375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 11.0, 24.0, 34.0, 90.0, 204.0, 235.0, 191.0, 100.0, 48.0, 20.0, 18.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.1308135986328, -191.84591674804688, -178.56101989746094, -165.276123046875, -151.99124145507812, -138.70632934570312, -125.42144775390625, -112.13655090332031, -98.85165405273438, -85.56675720214844, -72.2818603515625, -58.996971130371094, -45.712074279785156, -32.42717742919922, -19.142288208007812, -5.857391357421875, 7.4275054931640625, 20.712400436401367, 33.99729537963867, 47.282188415527344, 60.56708526611328, 73.85198211669922, 87.13687133789062, 100.42176818847656, 113.7066650390625, 126.99156188964844, 140.27645874023438, 153.56134033203125, 166.84625244140625, 180.13113403320312, 193.41603088378906, 206.700927734375, 219.98583984375, 233.27073669433594, 246.55563354492188, 259.84051513671875, 273.12542724609375, 286.4103088378906, 299.6951904296875, 312.9801025390625, 326.2650146484375, 339.5498962402344, 352.8348083496094, 366.11968994140625, 379.40460205078125, 392.6894836425781, 405.974365234375, 419.25927734375, 432.5441589355469, 445.82904052734375, 459.11395263671875, 472.3988342285156, 485.6837463378906, 498.9686279296875, 512.2535400390625, 525.5384521484375, 538.8233032226562, 552.1082153320312, 565.39306640625, 578.677978515625, 591.962890625, 605.247802734375, 618.5326538085938, 631.8175659179688, 645.1024780273438]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 11.0, 7.0, 4.0, 16.0, 13.0, 13.0, 17.0, 17.0, 21.0, 30.0, 37.0, 32.0, 39.0, 36.0, 49.0, 47.0, 36.0, 46.0, 40.0, 42.0, 49.0, 49.0, 32.0, 36.0, 40.0, 29.0, 34.0, 17.0, 27.0, 18.0, 12.0, 13.0, 20.0, 14.0, 11.0, 8.0, 11.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.3821258544922, -175.43370056152344, -168.48526000976562, -161.53683471679688, -154.58839416503906, -147.6399688720703, -140.6915283203125, -133.74310302734375, -126.79467010498047, -119.84623718261719, -112.8978042602539, -105.94937133789062, -99.00094604492188, -92.05250549316406, -85.10408020019531, -78.15564727783203, -71.20721435546875, -64.25878143310547, -57.31034851074219, -50.36191940307617, -43.41348648071289, -36.46505355834961, -29.516624450683594, -22.568191528320312, -15.619758605957031, -8.671326637268066, -1.7228946685791016, 5.225536346435547, 12.173969268798828, 19.12240219116211, 26.070831298828125, 33.019264221191406, 39.967681884765625, 46.916114807128906, 53.86454772949219, 60.8129768371582, 67.76141357421875, 74.7098388671875, 81.65827178955078, 88.60670471191406, 95.55513763427734, 102.50357055664062, 109.4520034790039, 116.40043640136719, 123.34886169433594, 130.29730224609375, 137.2457275390625, 144.19415283203125, 151.14259338378906, 158.0910186767578, 165.03945922851562, 171.98788452148438, 178.9363250732422, 185.88475036621094, 192.83319091796875, 199.7816162109375, 206.73004150390625, 213.678466796875, 220.6269073486328, 227.57533264160156, 234.52377319335938, 241.47219848632812, 248.42062377929688, 255.3690643310547, 262.3175048828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 12.0, 15.0, 13.0, 16.0, 30.0, 28.0, 39.0, 45.0, 76.0, 107.0, 131.0, 184.0, 284.0, 364.0, 520.0, 652.0, 910.0, 1040166.0, 1661.0, 853.0, 651.0, 457.0, 365.0, 249.0, 190.0, 153.0, 93.0, 67.0, 55.0, 45.0, 35.0, 15.0, 25.0, 15.0, 9.0, 8.0, 6.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.66717529296875, -69.10254669189453, -66.53791809082031, -63.97329330444336, -61.40866470336914, -58.84403610229492, -56.27941131591797, -53.71478271484375, -51.15015411376953, -48.58552551269531, -46.020896911621094, -43.45627212524414, -40.89164352416992, -38.3270149230957, -35.76239013671875, -33.19776153564453, -30.633132934570312, -28.068504333496094, -25.503877639770508, -22.939250946044922, -20.374622344970703, -17.809993743896484, -15.245367050170898, -12.680740356445312, -10.116111755371094, -7.551484107971191, -4.986856460571289, -2.4222288131713867, 0.14239883422851562, 2.707026481628418, 5.27165412902832, 7.836280822753906, 10.400909423828125, 12.965537071228027, 15.53016471862793, 18.094791412353516, 20.659420013427734, 23.224048614501953, 25.78867530822754, 28.353302001953125, 30.917930603027344, 33.48255920410156, 36.04718780517578, 38.611812591552734, 41.17644119262695, 43.74106979370117, 46.305694580078125, 48.870323181152344, 51.43495178222656, 53.99958038330078, 56.564208984375, 59.12883377075195, 61.69346237182617, 64.25808715820312, 66.82271575927734, 69.38734436035156, 71.95197296142578, 74.5166015625, 77.08123016357422, 79.64585876464844, 82.21047973632812, 84.77510833740234, 87.33973693847656, 89.90436553955078, 92.468994140625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 10.0, 22.0, 26.0, 62.0, 219.0, 51459000.0, 3579.0, 81.0, 44.0, 21.0, 19.0, 5.0, 6.0, 7.0, 1.0, 5.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4572.0, -4371.81298828125, -4171.6259765625, -3971.43896484375, -3771.251953125, -3571.06494140625, -3370.8779296875, -3170.69091796875, -2970.50390625, -2770.31689453125, -2570.1298828125, -2369.94287109375, -2169.755859375, -1969.56884765625, -1769.3817138671875, -1569.1947021484375, -1369.007568359375, -1168.820556640625, -968.633544921875, -768.4464721679688, -568.2594604492188, -368.07244873046875, -167.8853759765625, 32.3016357421875, 232.4886474609375, 432.6756591796875, 632.8626708984375, 833.0497436523438, 1033.23681640625, 1233.423828125, 1433.61083984375, 1633.7978515625, 1833.98486328125, 2034.171875, 2234.35888671875, 2434.5458984375, 2634.73291015625, 2834.919921875, 3035.10693359375, 3235.2939453125, 3435.48095703125, 3635.66796875, 3835.85498046875, 4036.0419921875, 4236.22900390625, 4436.416015625, 4636.60302734375, 4836.7900390625, 5036.9775390625, 5237.16455078125, 5437.3515625, 5637.53857421875, 5837.7255859375, 6037.91259765625, 6238.099609375, 6438.28662109375, 6638.4736328125, 6838.66064453125, 7038.84765625, 7239.03466796875, 7439.2216796875, 7639.40869140625, 7839.595703125, 8039.78271484375, 8239.9697265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 3.0, 9.0, 18.0, 21.0, 29.0, 50.0, 80.0, 124.0, 203.0, 288.0, 508.0, 761.0, 1108.0, 1729.0, 2827.0, 4411.0, 6534.0, 10192.0, 15574.0, 23487.0, 36097.0, 54458.0, 81677.0, 122500.0, 176319.0, 246769.0, 333585.0, 808138.0, 3041394.0, 399738.0, 283676.0, 206709.0, 143841.0, 97701.0, 65945.0, 43217.0, 28139.0, 18762.0, 11923.0, 7902.0, 5333.0, 3420.0, 2149.0, 1390.0, 949.0, 642.0, 394.0, 252.0, 170.0, 93.0, 81.0, 52.0, 30.0, 16.0, 12.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9274444580078125, -1.863677978515625, -1.7999114990234375, -1.73614501953125, -1.6723785400390625, -1.608612060546875, -1.5448455810546875, -1.4810791015625, -1.4173126220703125, -1.353546142578125, -1.2897796630859375, -1.22601318359375, -1.1622467041015625, -1.098480224609375, -1.0347137451171875, -0.970947265625, -0.9071807861328125, -0.843414306640625, -0.7796478271484375, -0.71588134765625, -0.6521148681640625, -0.588348388671875, -0.5245819091796875, -0.4608154296875, -0.3970489501953125, -0.333282470703125, -0.2695159912109375, -0.20574951171875, -0.1419830322265625, -0.078216552734375, -0.0144500732421875, 0.04931640625, 0.1130828857421875, 0.176849365234375, 0.2406158447265625, 0.30438232421875, 0.3681488037109375, 0.431915283203125, 0.4956817626953125, 0.5594482421875, 0.6232147216796875, 0.686981201171875, 0.7507476806640625, 0.81451416015625, 0.8782806396484375, 0.942047119140625, 1.0058135986328125, 1.069580078125, 1.1333465576171875, 1.197113037109375, 1.2608795166015625, 1.32464599609375, 1.3884124755859375, 1.452178955078125, 1.5159454345703125, 1.5797119140625, 1.6434783935546875, 1.707244873046875, 1.7710113525390625, 1.83477783203125, 1.8985443115234375, 1.962310791015625, 2.0260772705078125, 2.08984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 11.0, 11.0, 10.0, 9.0, 18.0, 19.0, 21.0, 33.0, 27.0, 41.0, 32.0, 45.0, 42.0, 39.0, 35.0, 34.0, 41.0, 945.0, 180.0, 38.0, 41.0, 33.0, 35.0, 29.0, 29.0, 29.0, 37.0, 24.0, 22.0, 20.0, 14.0, 12.0, 12.0, 9.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.265625, -29.247802734375, -28.22998046875, -27.212158203125, -26.1943359375, -25.176513671875, -24.15869140625, -23.140869140625, -22.123046875, -21.105224609375, -20.08740234375, -19.069580078125, -18.0517578125, -17.033935546875, -16.01611328125, -14.998291015625, -13.98046875, -12.962646484375, -11.94482421875, -10.927001953125, -9.9091796875, -8.891357421875, -7.87353515625, -6.855712890625, -5.837890625, -4.820068359375, -3.80224609375, -2.784423828125, -1.7666015625, -0.748779296875, 0.26904296875, 1.286865234375, 2.3046875, 3.322509765625, 4.34033203125, 5.358154296875, 6.3759765625, 7.393798828125, 8.41162109375, 9.429443359375, 10.447265625, 11.465087890625, 12.48291015625, 13.500732421875, 14.5185546875, 15.536376953125, 16.55419921875, 17.572021484375, 18.58984375, 19.607666015625, 20.62548828125, 21.643310546875, 22.6611328125, 23.678955078125, 24.69677734375, 25.714599609375, 26.732421875, 27.750244140625, 28.76806640625, 29.785888671875, 30.8037109375, 31.821533203125, 32.83935546875, 33.857177734375, 34.875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 16.0, 17.0, 20.0, 32.0, 53.0, 66.0, 72.0, 128.0, 208.0, 275.0, 421.0, 626.0, 971.0, 1424.0, 2259.0, 3407.0, 5308.0, 8227.0, 13049.0, 20508.0, 32120.0, 50952.0, 80054.0, 125089.0, 192419.0, 285647.0, 425331.0, 2627330.0, 1284892.0, 381605.0, 261464.0, 175272.0, 113483.0, 71961.0, 45899.0, 29099.0, 18359.0, 11792.0, 7519.0, 4993.0, 3062.0, 2079.0, 1379.0, 786.0, 598.0, 381.0, 268.0, 168.0, 121.0, 81.0, 57.0, 27.0, 22.0, 15.0, 21.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 3.0], "bins": [-2.27734375, -2.201141357421875, -2.12493896484375, -2.048736572265625, -1.9725341796875, -1.896331787109375, -1.82012939453125, -1.743927001953125, -1.667724609375, -1.591522216796875, -1.51531982421875, -1.439117431640625, -1.3629150390625, -1.286712646484375, -1.21051025390625, -1.134307861328125, -1.05810546875, -0.981903076171875, -0.90570068359375, -0.829498291015625, -0.7532958984375, -0.677093505859375, -0.60089111328125, -0.524688720703125, -0.448486328125, -0.372283935546875, -0.29608154296875, -0.219879150390625, -0.1436767578125, -0.067474365234375, 0.00872802734375, 0.084930419921875, 0.1611328125, 0.237335205078125, 0.31353759765625, 0.389739990234375, 0.4659423828125, 0.542144775390625, 0.61834716796875, 0.694549560546875, 0.770751953125, 0.846954345703125, 0.92315673828125, 0.999359130859375, 1.0755615234375, 1.151763916015625, 1.22796630859375, 1.304168701171875, 1.38037109375, 1.456573486328125, 1.53277587890625, 1.608978271484375, 1.6851806640625, 1.761383056640625, 1.83758544921875, 1.913787841796875, 1.989990234375, 2.066192626953125, 2.14239501953125, 2.218597412109375, 2.2947998046875, 2.371002197265625, 2.44720458984375, 2.523406982421875, 2.599609375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 8.0, 6.0, 5.0, 8.0, 6.0, 15.0, 7.0, 21.0, 12.0, 22.0, 22.0, 33.0, 27.0, 31.0, 37.0, 40.0, 30.0, 42.0, 36.0, 49.0, 746.0, 358.0, 43.0, 38.0, 41.0, 33.0, 29.0, 36.0, 31.0, 24.0, 30.0, 24.0, 21.0, 19.0, 13.0, 17.0, 9.0, 11.0, 15.0, 6.0, 12.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.6875, -28.784912109375, -27.88232421875, -26.979736328125, -26.0771484375, -25.174560546875, -24.27197265625, -23.369384765625, -22.466796875, -21.564208984375, -20.66162109375, -19.759033203125, -18.8564453125, -17.953857421875, -17.05126953125, -16.148681640625, -15.24609375, -14.343505859375, -13.44091796875, -12.538330078125, -11.6357421875, -10.733154296875, -9.83056640625, -8.927978515625, -8.025390625, -7.122802734375, -6.22021484375, -5.317626953125, -4.4150390625, -3.512451171875, -2.60986328125, -1.707275390625, -0.8046875, 0.097900390625, 1.00048828125, 1.903076171875, 2.8056640625, 3.708251953125, 4.61083984375, 5.513427734375, 6.416015625, 7.318603515625, 8.22119140625, 9.123779296875, 10.0263671875, 10.928955078125, 11.83154296875, 12.734130859375, 13.63671875, 14.539306640625, 15.44189453125, 16.344482421875, 17.2470703125, 18.149658203125, 19.05224609375, 19.954833984375, 20.857421875, 21.760009765625, 22.66259765625, 23.565185546875, 24.4677734375, 25.370361328125, 26.27294921875, 27.175537109375, 28.078125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 10.0, 5.0, 2.0, 2.0, 7.0, 4.0, 10.0, 13.0, 24.0, 24.0, 42.0, 64.0, 108.0, 133.0, 169.0, 261.0, 415.0, 586.0, 942.0, 1592.0, 2746.0, 5581.0, 13349.0, 42607.0, 191923.0, 5855519.0, 123374.0, 30480.0, 10595.0, 4600.0, 2336.0, 1431.0, 847.0, 526.0, 358.0, 250.0, 136.0, 99.0, 76.0, 58.0, 34.0, 19.0, 20.0, 11.0, 16.0, 9.0, 14.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.75, -16.1796875, -15.609375, -15.0390625, -14.46875, -13.8984375, -13.328125, -12.7578125, -12.1875, -11.6171875, -11.046875, -10.4765625, -9.90625, -9.3359375, -8.765625, -8.1953125, -7.625, -7.0546875, -6.484375, -5.9140625, -5.34375, -4.7734375, -4.203125, -3.6328125, -3.0625, -2.4921875, -1.921875, -1.3515625, -0.78125, -0.2109375, 0.359375, 0.9296875, 1.5, 2.0703125, 2.640625, 3.2109375, 3.78125, 4.3515625, 4.921875, 5.4921875, 6.0625, 6.6328125, 7.203125, 7.7734375, 8.34375, 8.9140625, 9.484375, 10.0546875, 10.625, 11.1953125, 11.765625, 12.3359375, 12.90625, 13.4765625, 14.046875, 14.6171875, 15.1875, 15.7578125, 16.328125, 16.8984375, 17.46875, 18.0390625, 18.609375, 19.1796875, 19.75]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 6.0, 8.0, 7.0, 17.0, 14.0, 16.0, 10.0, 22.0, 22.0, 15.0, 30.0, 29.0, 32.0, 26.0, 32.0, 32.0, 43.0, 33.0, 33.0, 61.0, 825.0, 245.0, 39.0, 37.0, 40.0, 34.0, 32.0, 32.0, 35.0, 10.0, 29.0, 16.0, 17.0, 16.0, 20.0, 15.0, 12.0, 6.0, 9.0, 13.0, 9.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-24.453125, -23.7294921875, -23.005859375, -22.2822265625, -21.55859375, -20.8349609375, -20.111328125, -19.3876953125, -18.6640625, -17.9404296875, -17.216796875, -16.4931640625, -15.76953125, -15.0458984375, -14.322265625, -13.5986328125, -12.875, -12.1513671875, -11.427734375, -10.7041015625, -9.98046875, -9.2568359375, -8.533203125, -7.8095703125, -7.0859375, -6.3623046875, -5.638671875, -4.9150390625, -4.19140625, -3.4677734375, -2.744140625, -2.0205078125, -1.296875, -0.5732421875, 0.150390625, 0.8740234375, 1.59765625, 2.3212890625, 3.044921875, 3.7685546875, 4.4921875, 5.2158203125, 5.939453125, 6.6630859375, 7.38671875, 8.1103515625, 8.833984375, 9.5576171875, 10.28125, 11.0048828125, 11.728515625, 12.4521484375, 13.17578125, 13.8994140625, 14.623046875, 15.3466796875, 16.0703125, 16.7939453125, 17.517578125, 18.2412109375, 18.96484375, 19.6884765625, 20.412109375, 21.1357421875, 21.859375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 21.0, 22.0, 59.0, 85.0, 197.0, 263.0, 176.0, 67.0, 53.0, 14.0, 16.0, 11.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.6446762084961, -113.8871841430664, -111.12968444824219, -108.3721923828125, -105.61470031738281, -102.8572006225586, -100.0997085571289, -97.34220886230469, -94.584716796875, -91.82722473144531, -89.0697250366211, -86.3122329711914, -83.55473327636719, -80.7972412109375, -78.03974914550781, -75.28225708007812, -72.5247573852539, -69.76726531982422, -67.009765625, -64.25227355957031, -61.49477767944336, -58.737281799316406, -55.97978973388672, -53.222293853759766, -50.46479797363281, -47.70730209350586, -44.949806213378906, -42.19231414794922, -39.434818267822266, -36.67732238769531, -33.919830322265625, -31.162334442138672, -28.40484619140625, -25.647350311279297, -22.889856338500977, -20.132362365722656, -17.374866485595703, -14.617371559143066, -11.85987663269043, -9.10238265991211, -6.344886779785156, -3.5873918533325195, -0.8298969268798828, 1.927597999572754, 4.685092926025391, 7.442587852478027, 10.200082778930664, 12.957576751708984, 15.715072631835938, 18.47256851196289, 21.23006248474121, 23.98755645751953, 26.745052337646484, 29.502548217773438, 32.260040283203125, 35.01753616333008, 37.77503204345703, 40.532527923583984, 43.29002380371094, 46.047515869140625, 48.80501174926758, 51.56250762939453, 54.31999969482422, 57.07749557495117, 59.834991455078125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 20.0, 33.0, 48.0, 57.0, 53.0, 81.0, 83.0, 81.0, 89.0, 76.0, 77.0, 75.0, 55.0, 59.0, 47.0, 23.0, 15.0, 16.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.69186401367188, -165.88055419921875, -162.06924438476562, -158.2579345703125, -154.44662475585938, -150.63531494140625, -146.82400512695312, -143.0126953125, -139.20138549804688, -135.39007568359375, -131.57876586914062, -127.7674560546875, -123.95614624023438, -120.14483642578125, -116.33352661132812, -112.522216796875, -108.71090698242188, -104.89959716796875, -101.08828735351562, -97.2769775390625, -93.46566772460938, -89.65435791015625, -85.84304809570312, -82.03173828125, -78.22042846679688, -74.40911865234375, -70.59780883789062, -66.7864990234375, -62.975189208984375, -59.16387939453125, -55.352569580078125, -51.541259765625, -47.729949951171875, -43.91864013671875, -40.107330322265625, -36.2960205078125, -32.484710693359375, -28.67340087890625, -24.862091064453125, -21.05078125, -17.239471435546875, -13.42816162109375, -9.616851806640625, -5.8055419921875, -1.994232177734375, 1.81707763671875, 5.628387451171875, 9.439697265625, 13.251007080078125, 17.06231689453125, 20.873626708984375, 24.6849365234375, 28.496246337890625, 32.30755615234375, 36.118865966796875, 39.93017578125, 43.741485595703125, 47.55279541015625, 51.364105224609375, 55.1754150390625, 58.986724853515625, 62.79803466796875, 66.60934448242188, 70.420654296875, 74.23196411132812]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 4.0, 8.0, 6.0, 16.0, 8.0, 11.0, 10.0, 19.0, 23.0, 19.0, 29.0, 44.0, 48.0, 69.0, 113.0, 185.0, 298.0, 508.0, 1046.0, 2349.0, 5823.0, 23612.0, 4058896.0, 84904.0, 10177.0, 3308.0, 1309.0, 631.0, 303.0, 188.0, 122.0, 63.0, 46.0, 28.0, 18.0, 11.0, 8.0, 6.0, 2.0, 3.0, 2.0], "bins": [-2.69921875, -2.6402130126953125, -2.581207275390625, -2.5222015380859375, -2.46319580078125, -2.4041900634765625, -2.345184326171875, -2.2861785888671875, -2.2271728515625, -2.1681671142578125, -2.109161376953125, -2.0501556396484375, -1.99114990234375, -1.9321441650390625, -1.873138427734375, -1.8141326904296875, -1.755126953125, -1.6961212158203125, -1.637115478515625, -1.5781097412109375, -1.51910400390625, -1.4600982666015625, -1.401092529296875, -1.3420867919921875, -1.2830810546875, -1.2240753173828125, -1.165069580078125, -1.1060638427734375, -1.04705810546875, -0.9880523681640625, -0.929046630859375, -0.8700408935546875, -0.81103515625, -0.7520294189453125, -0.693023681640625, -0.6340179443359375, -0.57501220703125, -0.5160064697265625, -0.457000732421875, -0.3979949951171875, -0.3389892578125, -0.2799835205078125, -0.220977783203125, -0.1619720458984375, -0.10296630859375, -0.0439605712890625, 0.015045166015625, 0.0740509033203125, 0.133056640625, 0.1920623779296875, 0.251068115234375, 0.3100738525390625, 0.36907958984375, 0.4280853271484375, 0.487091064453125, 0.5460968017578125, 0.6051025390625, 0.6641082763671875, 0.723114013671875, 0.7821197509765625, 0.84112548828125, 0.9001312255859375, 0.959136962890625, 1.0181427001953125, 1.0771484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 10.0, 29.0, 36.0, 795.0, 31.0, 32.0, 19.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8837890625, -0.8643226623535156, -0.8448562622070312, -0.8253898620605469, -0.8059234619140625, -0.7864570617675781, -0.7669906616210938, -0.7475242614746094, -0.728057861328125, -0.7085914611816406, -0.6891250610351562, -0.6696586608886719, -0.6501922607421875, -0.6307258605957031, -0.6112594604492188, -0.5917930603027344, -0.57232666015625, -0.5528602600097656, -0.5333938598632812, -0.5139274597167969, -0.4944610595703125, -0.4749946594238281, -0.45552825927734375, -0.4360618591308594, -0.416595458984375, -0.3971290588378906, -0.37766265869140625, -0.3581962585449219, -0.3387298583984375, -0.3192634582519531, -0.29979705810546875, -0.2803306579589844, -0.2608642578125, -0.24139785766601562, -0.22193145751953125, -0.20246505737304688, -0.1829986572265625, -0.16353225708007812, -0.14406585693359375, -0.12459945678710938, -0.105133056640625, -0.08566665649414062, -0.06620025634765625, -0.046733856201171875, -0.0272674560546875, -0.007801055908203125, 0.01166534423828125, 0.031131744384765625, 0.05059814453125, 0.07006454467773438, 0.08953094482421875, 0.10899734497070312, 0.1284637451171875, 0.14793014526367188, 0.16739654541015625, 0.18686294555664062, 0.206329345703125, 0.22579574584960938, 0.24526214599609375, 0.2647285461425781, 0.2841949462890625, 0.3036613464355469, 0.32312774658203125, 0.3425941467285156, 0.362060546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 18.0, 10.0, 14.0, 20.0, 21.0, 30.0, 49.0, 72.0, 127.0, 176.0, 288.0, 501.0, 974.0, 1920.0, 4314.0, 10652.0, 32099.0, 146876.0, 3491009.0, 419056.0, 57066.0, 16462.0, 6344.0, 2817.0, 1422.0, 758.0, 394.0, 232.0, 143.0, 121.0, 66.0, 58.0, 42.0, 25.0, 25.0, 18.0, 9.0, 14.0, 6.0, 10.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.107421875, -1.0735626220703125, -1.039703369140625, -1.0058441162109375, -0.97198486328125, -0.9381256103515625, -0.904266357421875, -0.8704071044921875, -0.8365478515625, -0.8026885986328125, -0.768829345703125, -0.7349700927734375, -0.70111083984375, -0.6672515869140625, -0.633392333984375, -0.5995330810546875, -0.565673828125, -0.5318145751953125, -0.497955322265625, -0.4640960693359375, -0.43023681640625, -0.3963775634765625, -0.362518310546875, -0.3286590576171875, -0.2947998046875, -0.2609405517578125, -0.227081298828125, -0.1932220458984375, -0.15936279296875, -0.1255035400390625, -0.091644287109375, -0.0577850341796875, -0.02392578125, 0.0099334716796875, 0.043792724609375, 0.0776519775390625, 0.11151123046875, 0.1453704833984375, 0.179229736328125, 0.2130889892578125, 0.2469482421875, 0.2808074951171875, 0.314666748046875, 0.3485260009765625, 0.38238525390625, 0.4162445068359375, 0.450103759765625, 0.4839630126953125, 0.517822265625, 0.5516815185546875, 0.585540771484375, 0.6194000244140625, 0.65325927734375, 0.6871185302734375, 0.720977783203125, 0.7548370361328125, 0.7886962890625, 0.8225555419921875, 0.856414794921875, 0.8902740478515625, 0.92413330078125, 0.9579925537109375, 0.991851806640625, 1.0257110595703125, 1.0595703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 1.0, 7.0, 3.0, 4.0, 10.0, 15.0, 15.0, 19.0, 25.0, 39.0, 53.0, 83.0, 146.0, 407.0, 1766.0, 802.0, 252.0, 132.0, 97.0, 50.0, 40.0, 25.0, 18.0, 15.0, 11.0, 10.0, 2.0, 4.0, 1.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.47705078125, -0.4633216857910156, -0.44959259033203125, -0.4358634948730469, -0.4221343994140625, -0.4084053039550781, -0.39467620849609375, -0.3809471130371094, -0.367218017578125, -0.3534889221191406, -0.33975982666015625, -0.3260307312011719, -0.3123016357421875, -0.2985725402832031, -0.28484344482421875, -0.2711143493652344, -0.25738525390625, -0.24365615844726562, -0.22992706298828125, -0.21619796752929688, -0.2024688720703125, -0.18873977661132812, -0.17501068115234375, -0.16128158569335938, -0.147552490234375, -0.13382339477539062, -0.12009429931640625, -0.10636520385742188, -0.0926361083984375, -0.07890701293945312, -0.06517791748046875, -0.051448822021484375, -0.0377197265625, -0.023990631103515625, -0.01026153564453125, 0.003467559814453125, 0.0171966552734375, 0.030925750732421875, 0.04465484619140625, 0.058383941650390625, 0.072113037109375, 0.08584213256835938, 0.09957122802734375, 0.11330032348632812, 0.1270294189453125, 0.14075851440429688, 0.15448760986328125, 0.16821670532226562, 0.18194580078125, 0.19567489624023438, 0.20940399169921875, 0.22313308715820312, 0.2368621826171875, 0.2505912780761719, 0.26432037353515625, 0.2780494689941406, 0.291778564453125, 0.3055076599121094, 0.31923675537109375, 0.3329658508300781, 0.3466949462890625, 0.3604240417480469, 0.37415313720703125, 0.3878822326660156, 0.401611328125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 11.0, 15.0, 68.0, 238.0, 351.0, 216.0, 64.0, 22.0, 12.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2942087650299072, -1.1551530361175537, -1.0160973072052002, -0.8770414590835571, -0.7379857301712036, -0.5989300012588501, -0.4598742127418518, -0.3208184242248535, -0.1817626953125, -0.0427069365978241, 0.0963488221168518, 0.2354045808315277, 0.3744603395462036, 0.5135160684585571, 0.6525718569755554, 0.7916276454925537, 0.9306833744049072, 1.0697391033172607, 1.2087948322296143, 1.3478506803512573, 1.4869064092636108, 1.6259621381759644, 1.7650179862976074, 1.904073715209961, 2.0431294441223145, 2.182185173034668, 2.3212409019470215, 2.460296630859375, 2.5993523597717285, 2.738408088684082, 2.8774640560150146, 3.016519784927368, 3.1555752754211426, 3.294631004333496, 3.4336867332458496, 3.572742462158203, 3.7117981910705566, 3.85085391998291, 3.9899098873138428, 4.128965377807617, 4.268021583557129, 4.407077312469482, 4.546133041381836, 4.6851887702941895, 4.824244499206543, 4.9633002281188965, 5.10235595703125, 5.241412162780762, 5.380467414855957, 5.5195231437683105, 5.658578872680664, 5.797634601593018, 5.936690330505371, 6.075746059417725, 6.214801788330078, 6.35385799407959, 6.492913246154785, 6.631968975067139, 6.771024703979492, 6.910080432891846, 7.049136161804199, 7.188191890716553, 7.327247619628906, 7.466303825378418, 7.6053595542907715]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 15.0, 24.0, 40.0, 49.0, 75.0, 94.0, 89.0, 101.0, 101.0, 91.0, 53.0, 76.0, 61.0, 40.0, 26.0, 12.0, 12.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5944769382476807, -1.5182729959487915, -1.4420689344406128, -1.3658649921417236, -1.289660930633545, -1.2134569883346558, -1.1372530460357666, -1.061048984527588, -0.9848450422286987, -0.9086410403251648, -0.8324370384216309, -0.7562330961227417, -0.6800290942192078, -0.6038250923156738, -0.5276211500167847, -0.45141714811325073, -0.3752131462097168, -0.29900914430618286, -0.2228051722049713, -0.14660118520259857, -0.07039719820022583, 0.0058068037033081055, 0.08201077580451965, 0.1582147479057312, 0.23441874980926514, 0.3106227517127991, 0.3868267238140106, 0.46303069591522217, 0.5392346978187561, 0.61543869972229, 0.6916426420211792, 0.7678466439247131, 0.8440508842468262, 0.9202548861503601, 0.996458888053894, 1.0726628303527832, 1.148866891860962, 1.225070834159851, 1.3012747764587402, 1.377478837966919, 1.453682780265808, 1.5298867225646973, 1.606090784072876, 1.6822947263717651, 1.7584986686706543, 1.834702730178833, 1.9109066724777222, 1.9871106147766113, 2.06331467628479, 2.1395187377929688, 2.2157225608825684, 2.291926622390747, 2.368130683898926, 2.4443345069885254, 2.520538568496704, 2.596742630004883, 2.6729464530944824, 2.749150514602661, 2.8253543376922607, 2.9015583992004395, 2.977762460708618, 3.053966522216797, 3.1301703453063965, 3.206374406814575, 3.282578468322754]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 6.0, 6.0, 7.0, 9.0, 6.0, 17.0, 22.0, 23.0, 26.0, 41.0, 57.0, 87.0, 153.0, 301.0, 516.0, 1226.0, 3286.0, 10223.0, 49757.0, 938304.0, 31933.0, 7914.0, 2530.0, 980.0, 430.0, 224.0, 129.0, 85.0, 61.0, 38.0, 38.0, 30.0, 18.0, 11.0, 13.0, 10.0, 10.0, 7.0, 4.0, 4.0, 7.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.39453125, -3.295806884765625, -3.19708251953125, -3.098358154296875, -2.9996337890625, -2.900909423828125, -2.80218505859375, -2.703460693359375, -2.604736328125, -2.506011962890625, -2.40728759765625, -2.308563232421875, -2.2098388671875, -2.111114501953125, -2.01239013671875, -1.913665771484375, -1.81494140625, -1.716217041015625, -1.61749267578125, -1.518768310546875, -1.4200439453125, -1.321319580078125, -1.22259521484375, -1.123870849609375, -1.025146484375, -0.926422119140625, -0.82769775390625, -0.728973388671875, -0.6302490234375, -0.531524658203125, -0.43280029296875, -0.334075927734375, -0.2353515625, -0.136627197265625, -0.03790283203125, 0.060821533203125, 0.1595458984375, 0.258270263671875, 0.35699462890625, 0.455718994140625, 0.554443359375, 0.653167724609375, 0.75189208984375, 0.850616455078125, 0.9493408203125, 1.048065185546875, 1.14678955078125, 1.245513916015625, 1.34423828125, 1.442962646484375, 1.54168701171875, 1.640411376953125, 1.7391357421875, 1.837860107421875, 1.93658447265625, 2.035308837890625, 2.134033203125, 2.232757568359375, 2.33148193359375, 2.430206298828125, 2.5289306640625, 2.627655029296875, 2.72637939453125, 2.825103759765625, 2.923828125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 18.0, 26.0, 220.0, 602.0, 33.0, 32.0, 13.0, 4.0, 14.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7236328125, -0.706878662109375, -0.69012451171875, -0.673370361328125, -0.6566162109375, -0.639862060546875, -0.62310791015625, -0.606353759765625, -0.589599609375, -0.572845458984375, -0.55609130859375, -0.539337158203125, -0.5225830078125, -0.505828857421875, -0.48907470703125, -0.472320556640625, -0.45556640625, -0.438812255859375, -0.42205810546875, -0.405303955078125, -0.3885498046875, -0.371795654296875, -0.35504150390625, -0.338287353515625, -0.321533203125, -0.304779052734375, -0.28802490234375, -0.271270751953125, -0.2545166015625, -0.237762451171875, -0.22100830078125, -0.204254150390625, -0.1875, -0.170745849609375, -0.15399169921875, -0.137237548828125, -0.1204833984375, -0.103729248046875, -0.08697509765625, -0.070220947265625, -0.053466796875, -0.036712646484375, -0.01995849609375, -0.003204345703125, 0.0135498046875, 0.030303955078125, 0.04705810546875, 0.063812255859375, 0.08056640625, 0.097320556640625, 0.11407470703125, 0.130828857421875, 0.1475830078125, 0.164337158203125, 0.18109130859375, 0.197845458984375, 0.214599609375, 0.231353759765625, 0.24810791015625, 0.264862060546875, 0.2816162109375, 0.298370361328125, 0.31512451171875, 0.331878662109375, 0.3486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 11.0, 15.0, 22.0, 31.0, 52.0, 68.0, 84.0, 146.0, 260.0, 427.0, 809.0, 1575.0, 3864.0, 11038.0, 46920.0, 308835.0, 564139.0, 83206.0, 17404.0, 5313.0, 2004.0, 977.0, 519.0, 298.0, 178.0, 103.0, 80.0, 53.0, 33.0, 20.0, 22.0, 11.0, 6.0, 6.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.57421875, -1.523712158203125, -1.47320556640625, -1.422698974609375, -1.3721923828125, -1.321685791015625, -1.27117919921875, -1.220672607421875, -1.170166015625, -1.119659423828125, -1.06915283203125, -1.018646240234375, -0.9681396484375, -0.917633056640625, -0.86712646484375, -0.816619873046875, -0.76611328125, -0.715606689453125, -0.66510009765625, -0.614593505859375, -0.5640869140625, -0.513580322265625, -0.46307373046875, -0.412567138671875, -0.362060546875, -0.311553955078125, -0.26104736328125, -0.210540771484375, -0.1600341796875, -0.109527587890625, -0.05902099609375, -0.008514404296875, 0.0419921875, 0.092498779296875, 0.14300537109375, 0.193511962890625, 0.2440185546875, 0.294525146484375, 0.34503173828125, 0.395538330078125, 0.446044921875, 0.496551513671875, 0.54705810546875, 0.597564697265625, 0.6480712890625, 0.698577880859375, 0.74908447265625, 0.799591064453125, 0.85009765625, 0.900604248046875, 0.95111083984375, 1.001617431640625, 1.0521240234375, 1.102630615234375, 1.15313720703125, 1.203643798828125, 1.254150390625, 1.304656982421875, 1.35516357421875, 1.405670166015625, 1.4561767578125, 1.506683349609375, 1.55718994140625, 1.607696533203125, 1.658203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 5.0, 8.0, 10.0, 6.0, 16.0, 10.0, 22.0, 21.0, 19.0, 22.0, 30.0, 21.0, 21.0, 31.0, 33.0, 38.0, 34.0, 50.0, 36.0, 45.0, 47.0, 41.0, 48.0, 40.0, 40.0, 30.0, 41.0, 23.0, 34.0, 28.0, 18.0, 16.0, 24.0, 14.0, 13.0, 13.0, 6.0, 5.0, 2.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0859375, -1.051116943359375, -1.01629638671875, -0.981475830078125, -0.9466552734375, -0.911834716796875, -0.87701416015625, -0.842193603515625, -0.807373046875, -0.772552490234375, -0.73773193359375, -0.702911376953125, -0.6680908203125, -0.633270263671875, -0.59844970703125, -0.563629150390625, -0.52880859375, -0.493988037109375, -0.45916748046875, -0.424346923828125, -0.3895263671875, -0.354705810546875, -0.31988525390625, -0.285064697265625, -0.250244140625, -0.215423583984375, -0.18060302734375, -0.145782470703125, -0.1109619140625, -0.076141357421875, -0.04132080078125, -0.006500244140625, 0.0283203125, 0.063140869140625, 0.09796142578125, 0.132781982421875, 0.1676025390625, 0.202423095703125, 0.23724365234375, 0.272064208984375, 0.306884765625, 0.341705322265625, 0.37652587890625, 0.411346435546875, 0.4461669921875, 0.480987548828125, 0.51580810546875, 0.550628662109375, 0.58544921875, 0.620269775390625, 0.65509033203125, 0.689910888671875, 0.7247314453125, 0.759552001953125, 0.79437255859375, 0.829193115234375, 0.864013671875, 0.898834228515625, 0.93365478515625, 0.968475341796875, 1.0032958984375, 1.038116455078125, 1.07293701171875, 1.107757568359375, 1.142578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 14.0, 13.0, 20.0, 38.0, 50.0, 97.0, 181.0, 428.0, 1322.0, 6623.0, 406011.0, 624120.0, 7250.0, 1408.0, 439.0, 236.0, 96.0, 69.0, 43.0, 23.0, 20.0, 11.0, 9.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.484375, -4.352569580078125, -4.22076416015625, -4.088958740234375, -3.9571533203125, -3.825347900390625, -3.69354248046875, -3.561737060546875, -3.429931640625, -3.298126220703125, -3.16632080078125, -3.034515380859375, -2.9027099609375, -2.770904541015625, -2.63909912109375, -2.507293701171875, -2.37548828125, -2.243682861328125, -2.11187744140625, -1.980072021484375, -1.8482666015625, -1.716461181640625, -1.58465576171875, -1.452850341796875, -1.321044921875, -1.189239501953125, -1.05743408203125, -0.925628662109375, -0.7938232421875, -0.662017822265625, -0.53021240234375, -0.398406982421875, -0.2666015625, -0.134796142578125, -0.00299072265625, 0.128814697265625, 0.2606201171875, 0.392425537109375, 0.52423095703125, 0.656036376953125, 0.787841796875, 0.919647216796875, 1.05145263671875, 1.183258056640625, 1.3150634765625, 1.446868896484375, 1.57867431640625, 1.710479736328125, 1.84228515625, 1.974090576171875, 2.10589599609375, 2.237701416015625, 2.3695068359375, 2.501312255859375, 2.63311767578125, 2.764923095703125, 2.896728515625, 3.028533935546875, 3.16033935546875, 3.292144775390625, 3.4239501953125, 3.555755615234375, 3.68756103515625, 3.819366455078125, 3.951171875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 8.0, 8.0, 9.0, 16.0, 19.0, 21.0, 44.0, 48.0, 81.0, 132.0, 149.0, 127.0, 108.0, 92.0, 50.0, 30.0, 17.0, 10.0, 10.0, 5.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.200241088867188e-05, -6.867572665214539e-05, -6.53490424156189e-05, -6.202235817909241e-05, -5.869567394256592e-05, -5.536898970603943e-05, -5.204230546951294e-05, -4.871562123298645e-05, -4.538893699645996e-05, -4.206225275993347e-05, -3.873556852340698e-05, -3.540888428688049e-05, -3.2082200050354004e-05, -2.8755515813827515e-05, -2.5428831577301025e-05, -2.2102147340774536e-05, -1.8775463104248047e-05, -1.5448778867721558e-05, -1.2122094631195068e-05, -8.795410394668579e-06, -5.46872615814209e-06, -2.1420419216156006e-06, 1.1846423149108887e-06, 4.511326551437378e-06, 7.838010787963867e-06, 1.1164695024490356e-05, 1.4491379261016846e-05, 1.7818063497543335e-05, 2.1144747734069824e-05, 2.4471431970596313e-05, 2.7798116207122803e-05, 3.112480044364929e-05, 3.445148468017578e-05, 3.777816891670227e-05, 4.110485315322876e-05, 4.443153738975525e-05, 4.775822162628174e-05, 5.108490586280823e-05, 5.441159009933472e-05, 5.7738274335861206e-05, 6.10649585723877e-05, 6.439164280891418e-05, 6.771832704544067e-05, 7.104501128196716e-05, 7.437169551849365e-05, 7.769837975502014e-05, 8.102506399154663e-05, 8.435174822807312e-05, 8.767843246459961e-05, 9.10051167011261e-05, 9.433180093765259e-05, 9.765848517417908e-05, 0.00010098516941070557, 0.00010431185364723206, 0.00010763853788375854, 0.00011096522212028503, 0.00011429190635681152, 0.00011761859059333801, 0.0001209452748298645, 0.000124271959066391, 0.00012759864330291748, 0.00013092532753944397, 0.00013425201177597046, 0.00013757869601249695, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 8.0, 9.0, 20.0, 33.0, 38.0, 53.0, 114.0, 190.0, 384.0, 830.0, 2316.0, 8876.0, 103814.0, 889124.0, 34619.0, 5173.0, 1626.0, 648.0, 274.0, 152.0, 86.0, 59.0, 25.0, 26.0, 14.0, 16.0, 9.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111328125, -3.02325439453125, -2.9351806640625, -2.84710693359375, -2.759033203125, -2.67095947265625, -2.5828857421875, -2.49481201171875, -2.40673828125, -2.31866455078125, -2.2305908203125, -2.14251708984375, -2.054443359375, -1.96636962890625, -1.8782958984375, -1.79022216796875, -1.7021484375, -1.61407470703125, -1.5260009765625, -1.43792724609375, -1.349853515625, -1.26177978515625, -1.1737060546875, -1.08563232421875, -0.99755859375, -0.90948486328125, -0.8214111328125, -0.73333740234375, -0.645263671875, -0.55718994140625, -0.4691162109375, -0.38104248046875, -0.29296875, -0.20489501953125, -0.1168212890625, -0.02874755859375, 0.059326171875, 0.14739990234375, 0.2354736328125, 0.32354736328125, 0.41162109375, 0.49969482421875, 0.5877685546875, 0.67584228515625, 0.763916015625, 0.85198974609375, 0.9400634765625, 1.02813720703125, 1.1162109375, 1.20428466796875, 1.2923583984375, 1.38043212890625, 1.468505859375, 1.55657958984375, 1.6446533203125, 1.73272705078125, 1.82080078125, 1.90887451171875, 1.9969482421875, 2.08502197265625, 2.173095703125, 2.26116943359375, 2.3492431640625, 2.43731689453125, 2.525390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 7.0, 8.0, 11.0, 23.0, 23.0, 38.0, 65.0, 85.0, 138.0, 149.0, 135.0, 121.0, 68.0, 44.0, 31.0, 29.0, 5.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5458984375, -1.4880523681640625, -1.430206298828125, -1.3723602294921875, -1.31451416015625, -1.2566680908203125, -1.198822021484375, -1.1409759521484375, -1.0831298828125, -1.0252838134765625, -0.967437744140625, -0.9095916748046875, -0.85174560546875, -0.7938995361328125, -0.736053466796875, -0.6782073974609375, -0.620361328125, -0.5625152587890625, -0.504669189453125, -0.4468231201171875, -0.38897705078125, -0.3311309814453125, -0.273284912109375, -0.2154388427734375, -0.1575927734375, -0.0997467041015625, -0.041900634765625, 0.0159454345703125, 0.07379150390625, 0.1316375732421875, 0.189483642578125, 0.2473297119140625, 0.30517578125, 0.3630218505859375, 0.420867919921875, 0.4787139892578125, 0.53656005859375, 0.5944061279296875, 0.652252197265625, 0.7100982666015625, 0.7679443359375, 0.8257904052734375, 0.883636474609375, 0.9414825439453125, 0.99932861328125, 1.0571746826171875, 1.115020751953125, 1.1728668212890625, 1.230712890625, 1.2885589599609375, 1.346405029296875, 1.4042510986328125, 1.46209716796875, 1.5199432373046875, 1.577789306640625, 1.6356353759765625, 1.6934814453125, 1.7513275146484375, 1.809173583984375, 1.8670196533203125, 1.92486572265625, 1.9827117919921875, 2.040557861328125, 2.0984039306640625, 2.15625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 41.0, 259.0, 588.0, 79.0, 19.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.32780838012695, -45.94390106201172, -44.55999755859375, -43.176090240478516, -41.79218292236328, -40.40827941894531, -39.02437210083008, -37.640464782714844, -36.256561279296875, -34.87265396118164, -33.48875045776367, -32.10484313964844, -30.720935821533203, -29.3370304107666, -27.953125, -26.569217681884766, -25.18531036376953, -23.80140495300293, -22.417497634887695, -21.033592224121094, -19.64968490600586, -18.265779495239258, -16.881874084472656, -15.497967720031738, -14.11406135559082, -12.730154991149902, -11.346248626708984, -9.962343215942383, -8.578436851501465, -7.194530487060547, -5.810625076293945, -4.426718711853027, -3.042816162109375, -1.6589100360870361, -0.27500391006469727, 1.1089019775390625, 2.4928083419799805, 3.8767147064208984, 5.2606201171875, 6.644526481628418, 8.028432846069336, 9.412339210510254, 10.796245574951172, 12.180150985717773, 13.564057350158691, 14.94796371459961, 16.33186912536621, 17.715774536132812, 19.099681854248047, 20.48358726501465, 21.867494583129883, 23.251399993896484, 24.63530731201172, 26.01921272277832, 27.403118133544922, 28.787025451660156, 30.170930862426758, 31.55483627319336, 32.938743591308594, 34.32264709472656, 35.7065544128418, 37.09046173095703, 38.474365234375, 39.858272552490234, 41.24217987060547]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 6.0, 15.0, 20.0, 37.0, 57.0, 87.0, 118.0, 135.0, 146.0, 111.0, 79.0, 71.0, 26.0, 15.0, 11.0, 11.0, 3.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.342493057250977, -22.585756301879883, -21.829021453857422, -21.072284698486328, -20.315549850463867, -19.558813095092773, -18.802078247070312, -18.04534149169922, -17.288604736328125, -16.53186798095703, -15.77513313293457, -15.018396377563477, -14.261661529541016, -13.504924774169922, -12.748188972473145, -11.991453170776367, -11.234718322753906, -10.477982521057129, -9.721246719360352, -8.964509963989258, -8.207775115966797, -7.451038837432861, -6.694302558898926, -5.937566757202148, -5.180830955505371, -4.424095153808594, -3.6673591136932373, -2.910623073577881, -2.1538872718811035, -1.3971514701843262, -0.6404151916503906, 0.11632061004638672, 0.8730564117431641, 1.629792332649231, 2.386528253555298, 3.1432642936706543, 3.9000000953674316, 4.656735897064209, 5.4134721755981445, 6.170207977294922, 6.926943778991699, 7.683679580688477, 8.440415382385254, 9.197151184082031, 9.953887939453125, 10.710622787475586, 11.46735954284668, 12.224095344543457, 12.980831146240234, 13.737566947937012, 14.494302749633789, 15.251039505004883, 16.007774353027344, 16.764511108398438, 17.52124786376953, 18.277982711791992, 19.034717559814453, 19.791454315185547, 20.548189163208008, 21.3049259185791, 22.061660766601562, 22.818397521972656, 23.57513427734375, 24.33186912536621, 25.088605880737305]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 14.0, 37.0, 65.0, 120.0, 344.0, 1512.0, 9045.0, 3846589.0, 329982.0, 5370.0, 882.0, 205.0, 58.0, 29.0, 13.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.6875, -16.353271484375, -16.01904296875, -15.684814453125, -15.3505859375, -15.016357421875, -14.68212890625, -14.347900390625, -14.013671875, -13.679443359375, -13.34521484375, -13.010986328125, -12.6767578125, -12.342529296875, -12.00830078125, -11.674072265625, -11.33984375, -11.005615234375, -10.67138671875, -10.337158203125, -10.0029296875, -9.668701171875, -9.33447265625, -9.000244140625, -8.666015625, -8.331787109375, -7.99755859375, -7.663330078125, -7.3291015625, -6.994873046875, -6.66064453125, -6.326416015625, -5.9921875, -5.657958984375, -5.32373046875, -4.989501953125, -4.6552734375, -4.321044921875, -3.98681640625, -3.652587890625, -3.318359375, -2.984130859375, -2.64990234375, -2.315673828125, -1.9814453125, -1.647216796875, -1.31298828125, -0.978759765625, -0.64453125, -0.310302734375, 0.02392578125, 0.358154296875, 0.6923828125, 1.026611328125, 1.36083984375, 1.695068359375, 2.029296875, 2.363525390625, 2.69775390625, 3.031982421875, 3.3662109375, 3.700439453125, 4.03466796875, 4.368896484375, 4.703125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 4.0, 7.0, 9.0, 11.0, 13.0, 16.0, 35.0, 83.0, 191.0, 307.0, 153.0, 60.0, 31.0, 16.0, 9.0, 15.0, 6.0, 8.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3408203125, -0.33235931396484375, -0.3238983154296875, -0.31543731689453125, -0.306976318359375, -0.29851531982421875, -0.2900543212890625, -0.28159332275390625, -0.27313232421875, -0.26467132568359375, -0.2562103271484375, -0.24774932861328125, -0.239288330078125, -0.23082733154296875, -0.2223663330078125, -0.21390533447265625, -0.2054443359375, -0.19698333740234375, -0.1885223388671875, -0.18006134033203125, -0.171600341796875, -0.16313934326171875, -0.1546783447265625, -0.14621734619140625, -0.13775634765625, -0.12929534912109375, -0.1208343505859375, -0.11237335205078125, -0.103912353515625, -0.09545135498046875, -0.0869903564453125, -0.07852935791015625, -0.070068359375, -0.06160736083984375, -0.0531463623046875, -0.04468536376953125, -0.036224365234375, -0.02776336669921875, -0.0193023681640625, -0.01084136962890625, -0.00238037109375, 0.00608062744140625, 0.0145416259765625, 0.02300262451171875, 0.031463623046875, 0.03992462158203125, 0.0483856201171875, 0.05684661865234375, 0.0653076171875, 0.07376861572265625, 0.0822296142578125, 0.09069061279296875, 0.099151611328125, 0.10761260986328125, 0.1160736083984375, 0.12453460693359375, 0.13299560546875, 0.14145660400390625, 0.1499176025390625, 0.15837860107421875, 0.166839599609375, 0.17530059814453125, 0.1837615966796875, 0.19222259521484375, 0.20068359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 9.0, 10.0, 14.0, 34.0, 61.0, 125.0, 253.0, 654.0, 2148.0, 9659.0, 94355.0, 3936005.0, 134627.0, 12373.0, 2549.0, 823.0, 324.0, 130.0, 61.0, 33.0, 17.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.186920166015625, -4.06915283203125, -3.951385498046875, -3.8336181640625, -3.715850830078125, -3.59808349609375, -3.480316162109375, -3.362548828125, -3.244781494140625, -3.12701416015625, -3.009246826171875, -2.8914794921875, -2.773712158203125, -2.65594482421875, -2.538177490234375, -2.42041015625, -2.302642822265625, -2.18487548828125, -2.067108154296875, -1.9493408203125, -1.831573486328125, -1.71380615234375, -1.596038818359375, -1.478271484375, -1.360504150390625, -1.24273681640625, -1.124969482421875, -1.0072021484375, -0.889434814453125, -0.77166748046875, -0.653900146484375, -0.5361328125, -0.418365478515625, -0.30059814453125, -0.182830810546875, -0.0650634765625, 0.052703857421875, 0.17047119140625, 0.288238525390625, 0.406005859375, 0.523773193359375, 0.64154052734375, 0.759307861328125, 0.8770751953125, 0.994842529296875, 1.11260986328125, 1.230377197265625, 1.34814453125, 1.465911865234375, 1.58367919921875, 1.701446533203125, 1.8192138671875, 1.936981201171875, 2.05474853515625, 2.172515869140625, 2.290283203125, 2.408050537109375, 2.52581787109375, 2.643585205078125, 2.7613525390625, 2.879119873046875, 2.99688720703125, 3.114654541015625, 3.232421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 7.0, 8.0, 15.0, 8.0, 11.0, 26.0, 39.0, 42.0, 66.0, 85.0, 160.0, 438.0, 1453.0, 962.0, 302.0, 137.0, 71.0, 57.0, 35.0, 36.0, 31.0, 13.0, 13.0, 9.0, 11.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.34765625, -0.3373756408691406, -0.32709503173828125, -0.3168144226074219, -0.3065338134765625, -0.2962532043457031, -0.28597259521484375, -0.2756919860839844, -0.265411376953125, -0.2551307678222656, -0.24485015869140625, -0.23456954956054688, -0.2242889404296875, -0.21400833129882812, -0.20372772216796875, -0.19344711303710938, -0.18316650390625, -0.17288589477539062, -0.16260528564453125, -0.15232467651367188, -0.1420440673828125, -0.13176345825195312, -0.12148284912109375, -0.11120223999023438, -0.100921630859375, -0.09064102172851562, -0.08036041259765625, -0.07007980346679688, -0.0597991943359375, -0.049518585205078125, -0.03923797607421875, -0.028957366943359375, -0.0186767578125, -0.008396148681640625, 0.00188446044921875, 0.012165069580078125, 0.0224456787109375, 0.032726287841796875, 0.04300689697265625, 0.053287506103515625, 0.063568115234375, 0.07384872436523438, 0.08412933349609375, 0.09440994262695312, 0.1046905517578125, 0.11497116088867188, 0.12525177001953125, 0.13553237915039062, 0.14581298828125, 0.15609359741210938, 0.16637420654296875, 0.17665481567382812, 0.1869354248046875, 0.19721603393554688, 0.20749664306640625, 0.21777725219726562, 0.228057861328125, 0.23833847045898438, 0.24861907958984375, 0.2588996887207031, 0.2691802978515625, 0.2794609069824219, 0.28974151611328125, 0.3000221252441406, 0.310302734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 21.0, 144.0, 719.0, 103.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.988882541656494, -7.617837429046631, -7.246792316436768, -6.875747203826904, -6.504702091217041, -6.133656978607178, -5.762612342834473, -5.391567230224609, -5.020522117614746, -4.649477005004883, -4.2784318923950195, -3.9073867797851562, -3.536341667175293, -3.1652965545654297, -2.7942516803741455, -2.4232065677642822, -2.05216121673584, -1.6811161041259766, -1.3100709915161133, -0.9390259981155396, -0.5679808855056763, -0.196935772895813, 0.17410922050476074, 0.545154333114624, 0.9161994457244873, 1.2872445583343506, 1.6582896709442139, 2.029334545135498, 2.4003796577453613, 2.7714247703552246, 3.142469882965088, 3.513514995574951, 3.8845605850219727, 4.255605697631836, 4.626650810241699, 4.9976959228515625, 5.368741035461426, 5.739786148071289, 6.110831260681152, 6.481876373291016, 6.852921485900879, 7.223966598510742, 7.5950117111206055, 7.966056823730469, 8.337101936340332, 8.708147048950195, 9.079192161560059, 9.450237274169922, 9.821281433105469, 10.192326545715332, 10.563371658325195, 10.934416770935059, 11.305461883544922, 11.676506996154785, 12.047552108764648, 12.418597221374512, 12.789642333984375, 13.160687446594238, 13.531732559204102, 13.902777671813965, 14.273822784423828, 14.644867897033691, 15.015913009643555, 15.386958122253418, 15.758003234863281]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 7.0, 7.0, 7.0, 10.0, 16.0, 36.0, 22.0, 20.0, 53.0, 50.0, 79.0, 68.0, 78.0, 59.0, 75.0, 91.0, 63.0, 50.0, 42.0, 38.0, 22.0, 22.0, 23.0, 17.0, 7.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8769762516021729, -1.81574547290802, -1.7545145750045776, -1.6932837963104248, -1.6320528984069824, -1.5708221197128296, -1.5095913410186768, -1.4483604431152344, -1.3871296644210815, -1.3258988857269287, -1.2646679878234863, -1.2034372091293335, -1.1422063112258911, -1.0809755325317383, -1.019744634628296, -0.9585138559341431, -0.8972830176353455, -0.8360521793365479, -0.7748213410377502, -0.7135905027389526, -0.6523597240447998, -0.5911288857460022, -0.5298980474472046, -0.46866723895072937, -0.40743640065193176, -0.34620556235313416, -0.28497475385665894, -0.22374391555786133, -0.16251309216022491, -0.1012822687625885, -0.040051430463790894, 0.021179378032684326, 0.08241021633148193, 0.14364103972911835, 0.20487186312675476, 0.26610270142555237, 0.3273335099220276, 0.3885643482208252, 0.4497951865196228, 0.5110260248184204, 0.5722568035125732, 0.6334876418113708, 0.6947184801101685, 0.7559492588043213, 0.8171800971031189, 0.8784109354019165, 0.9396417737007141, 1.0008726119995117, 1.062103509902954, 1.123334288597107, 1.1845651865005493, 1.2457959651947021, 1.3070268630981445, 1.3682576417922974, 1.4294884204864502, 1.4907193183898926, 1.5519500970840454, 1.6131808757781982, 1.6744117736816406, 1.7356425523757935, 1.7968734502792358, 1.8581042289733887, 1.919335126876831, 1.9805659055709839, 2.0417966842651367]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 8.0, 14.0, 22.0, 38.0, 41.0, 81.0, 122.0, 211.0, 520.0, 1474.0, 5030.0, 26348.0, 661655.0, 327686.0, 19040.0, 3937.0, 1253.0, 496.0, 214.0, 125.0, 62.0, 35.0, 15.0, 21.0, 19.0, 6.0, 11.0, 9.0, 10.0, 3.0, 2.0, 7.0, 4.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.40234375, -3.304901123046875, -3.20745849609375, -3.110015869140625, -3.0125732421875, -2.915130615234375, -2.81768798828125, -2.720245361328125, -2.622802734375, -2.525360107421875, -2.42791748046875, -2.330474853515625, -2.2330322265625, -2.135589599609375, -2.03814697265625, -1.940704345703125, -1.84326171875, -1.745819091796875, -1.64837646484375, -1.550933837890625, -1.4534912109375, -1.356048583984375, -1.25860595703125, -1.161163330078125, -1.063720703125, -0.966278076171875, -0.86883544921875, -0.771392822265625, -0.6739501953125, -0.576507568359375, -0.47906494140625, -0.381622314453125, -0.2841796875, -0.186737060546875, -0.08929443359375, 0.008148193359375, 0.1055908203125, 0.203033447265625, 0.30047607421875, 0.397918701171875, 0.495361328125, 0.592803955078125, 0.69024658203125, 0.787689208984375, 0.8851318359375, 0.982574462890625, 1.08001708984375, 1.177459716796875, 1.27490234375, 1.372344970703125, 1.46978759765625, 1.567230224609375, 1.6646728515625, 1.762115478515625, 1.85955810546875, 1.957000732421875, 2.054443359375, 2.151885986328125, 2.24932861328125, 2.346771240234375, 2.4442138671875, 2.541656494140625, 2.63909912109375, 2.736541748046875, 2.833984375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 7.0, 5.0, 12.0, 21.0, 28.0, 48.0, 84.0, 166.0, 233.0, 178.0, 109.0, 48.0, 19.0, 12.0, 8.0, 14.0, 3.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0], "bins": [-0.45068359375, -0.4415550231933594, -0.43242645263671875, -0.4232978820800781, -0.4141693115234375, -0.4050407409667969, -0.39591217041015625, -0.3867835998535156, -0.377655029296875, -0.3685264587402344, -0.35939788818359375, -0.3502693176269531, -0.3411407470703125, -0.3320121765136719, -0.32288360595703125, -0.3137550354003906, -0.30462646484375, -0.2954978942871094, -0.28636932373046875, -0.2772407531738281, -0.2681121826171875, -0.2589836120605469, -0.24985504150390625, -0.24072647094726562, -0.231597900390625, -0.22246932983398438, -0.21334075927734375, -0.20421218872070312, -0.1950836181640625, -0.18595504760742188, -0.17682647705078125, -0.16769790649414062, -0.1585693359375, -0.14944076538085938, -0.14031219482421875, -0.13118362426757812, -0.1220550537109375, -0.11292648315429688, -0.10379791259765625, -0.09466934204101562, -0.085540771484375, -0.07641220092773438, -0.06728363037109375, -0.058155059814453125, -0.0490264892578125, -0.039897918701171875, -0.03076934814453125, -0.021640777587890625, -0.01251220703125, -0.003383636474609375, 0.00574493408203125, 0.014873504638671875, 0.0240020751953125, 0.033130645751953125, 0.04225921630859375, 0.051387786865234375, 0.060516357421875, 0.06964492797851562, 0.07877349853515625, 0.08790206909179688, 0.0970306396484375, 0.10615921020507812, 0.11528778076171875, 0.12441635131835938, 0.133544921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 6.0, 5.0, 10.0, 74.0, 429.0, 9713.0, 1019463.0, 18027.0, 603.0, 89.0, 31.0, 13.0, 7.0, 8.0, 6.0, 3.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.30792236328125, -5.1080322265625, -4.90814208984375, -4.708251953125, -4.50836181640625, -4.3084716796875, -4.10858154296875, -3.90869140625, -3.70880126953125, -3.5089111328125, -3.30902099609375, -3.109130859375, -2.90924072265625, -2.7093505859375, -2.50946044921875, -2.3095703125, -2.10968017578125, -1.9097900390625, -1.70989990234375, -1.510009765625, -1.31011962890625, -1.1102294921875, -0.91033935546875, -0.71044921875, -0.51055908203125, -0.3106689453125, -0.11077880859375, 0.089111328125, 0.28900146484375, 0.4888916015625, 0.68878173828125, 0.888671875, 1.08856201171875, 1.2884521484375, 1.48834228515625, 1.688232421875, 1.88812255859375, 2.0880126953125, 2.28790283203125, 2.48779296875, 2.68768310546875, 2.8875732421875, 3.08746337890625, 3.287353515625, 3.48724365234375, 3.6871337890625, 3.88702392578125, 4.0869140625, 4.28680419921875, 4.4866943359375, 4.68658447265625, 4.886474609375, 5.08636474609375, 5.2862548828125, 5.48614501953125, 5.68603515625, 5.88592529296875, 6.0858154296875, 6.28570556640625, 6.485595703125, 6.68548583984375, 6.8853759765625, 7.08526611328125, 7.28515625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 4.0, 1.0, 7.0, 9.0, 7.0, 7.0, 13.0, 10.0, 15.0, 23.0, 23.0, 26.0, 22.0, 30.0, 43.0, 32.0, 35.0, 35.0, 48.0, 46.0, 43.0, 47.0, 44.0, 41.0, 41.0, 34.0, 44.0, 35.0, 31.0, 28.0, 24.0, 29.0, 29.0, 14.0, 10.0, 19.0, 11.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5923233032226562, -0.5738067626953125, -0.5552902221679688, -0.536773681640625, -0.5182571411132812, -0.4997406005859375, -0.48122406005859375, -0.46270751953125, -0.44419097900390625, -0.4256744384765625, -0.40715789794921875, -0.388641357421875, -0.37012481689453125, -0.3516082763671875, -0.33309173583984375, -0.3145751953125, -0.29605865478515625, -0.2775421142578125, -0.25902557373046875, -0.240509033203125, -0.22199249267578125, -0.2034759521484375, -0.18495941162109375, -0.16644287109375, -0.14792633056640625, -0.1294097900390625, -0.11089324951171875, -0.092376708984375, -0.07386016845703125, -0.0553436279296875, -0.03682708740234375, -0.018310546875, 0.00020599365234375, 0.0187225341796875, 0.03723907470703125, 0.055755615234375, 0.07427215576171875, 0.0927886962890625, 0.11130523681640625, 0.12982177734375, 0.14833831787109375, 0.1668548583984375, 0.18537139892578125, 0.203887939453125, 0.22240447998046875, 0.2409210205078125, 0.25943756103515625, 0.2779541015625, 0.29647064208984375, 0.3149871826171875, 0.33350372314453125, 0.352020263671875, 0.37053680419921875, 0.3890533447265625, 0.40756988525390625, 0.42608642578125, 0.44460296630859375, 0.4631195068359375, 0.48163604736328125, 0.500152587890625, 0.5186691284179688, 0.5371856689453125, 0.5557022094726562, 0.57421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 21.0, 75.0, 461.0, 1043842.0, 3958.0, 135.0, 19.0, 15.0, 8.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.070556640625, -23.96923828125, -22.867919921875, -21.7666015625, -20.665283203125, -19.56396484375, -18.462646484375, -17.361328125, -16.260009765625, -15.15869140625, -14.057373046875, -12.9560546875, -11.854736328125, -10.75341796875, -9.652099609375, -8.55078125, -7.449462890625, -6.34814453125, -5.246826171875, -4.1455078125, -3.044189453125, -1.94287109375, -0.841552734375, 0.259765625, 1.361083984375, 2.46240234375, 3.563720703125, 4.6650390625, 5.766357421875, 6.86767578125, 7.968994140625, 9.0703125, 10.171630859375, 11.27294921875, 12.374267578125, 13.4755859375, 14.576904296875, 15.67822265625, 16.779541015625, 17.880859375, 18.982177734375, 20.08349609375, 21.184814453125, 22.2861328125, 23.387451171875, 24.48876953125, 25.590087890625, 26.69140625, 27.792724609375, 28.89404296875, 29.995361328125, 31.0966796875, 32.197998046875, 33.29931640625, 34.400634765625, 35.501953125, 36.603271484375, 37.70458984375, 38.805908203125, 39.9072265625, 41.008544921875, 42.10986328125, 43.211181640625, 44.3125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 6.0, 13.0, 20.0, 18.0, 40.0, 59.0, 77.0, 102.0, 130.0, 123.0, 107.0, 84.0, 65.0, 46.0, 28.0, 19.0, 15.0, 10.0, 4.0, 9.0, 8.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00010526180267333984, -0.00010225921869277954, -9.925663471221924e-05, -9.625405073165894e-05, -9.325146675109863e-05, -9.024888277053833e-05, -8.724629878997803e-05, -8.424371480941772e-05, -8.124113082885742e-05, -7.823854684829712e-05, -7.523596286773682e-05, -7.223337888717651e-05, -6.923079490661621e-05, -6.622821092605591e-05, -6.32256269454956e-05, -6.02230429649353e-05, -5.7220458984375e-05, -5.42178750038147e-05, -5.1215291023254395e-05, -4.821270704269409e-05, -4.521012306213379e-05, -4.2207539081573486e-05, -3.9204955101013184e-05, -3.620237112045288e-05, -3.319978713989258e-05, -3.0197203159332275e-05, -2.7194619178771973e-05, -2.419203519821167e-05, -2.1189451217651367e-05, -1.8186867237091064e-05, -1.5184283256530762e-05, -1.2181699275970459e-05, -9.179115295410156e-06, -6.1765313148498535e-06, -3.1739473342895508e-06, -1.7136335372924805e-07, 2.8312206268310547e-06, 5.833804607391357e-06, 8.83638858795166e-06, 1.1838972568511963e-05, 1.4841556549072266e-05, 1.784414052963257e-05, 2.084672451019287e-05, 2.3849308490753174e-05, 2.6851892471313477e-05, 2.985447645187378e-05, 3.285706043243408e-05, 3.5859644412994385e-05, 3.886222839355469e-05, 4.186481237411499e-05, 4.486739635467529e-05, 4.7869980335235596e-05, 5.08725643157959e-05, 5.38751482963562e-05, 5.6877732276916504e-05, 5.988031625747681e-05, 6.288290023803711e-05, 6.588548421859741e-05, 6.888806819915771e-05, 7.189065217971802e-05, 7.489323616027832e-05, 7.789582014083862e-05, 8.089840412139893e-05, 8.390098810195923e-05, 8.690357208251953e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 11.0, 17.0, 27.0, 38.0, 76.0, 104.0, 229.0, 804.0, 5921.0, 941538.0, 96125.0, 2822.0, 520.0, 151.0, 66.0, 45.0, 18.0, 18.0, 11.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.59375, -5.42333984375, -5.2529296875, -5.08251953125, -4.912109375, -4.74169921875, -4.5712890625, -4.40087890625, -4.23046875, -4.06005859375, -3.8896484375, -3.71923828125, -3.548828125, -3.37841796875, -3.2080078125, -3.03759765625, -2.8671875, -2.69677734375, -2.5263671875, -2.35595703125, -2.185546875, -2.01513671875, -1.8447265625, -1.67431640625, -1.50390625, -1.33349609375, -1.1630859375, -0.99267578125, -0.822265625, -0.65185546875, -0.4814453125, -0.31103515625, -0.140625, 0.02978515625, 0.2001953125, 0.37060546875, 0.541015625, 0.71142578125, 0.8818359375, 1.05224609375, 1.22265625, 1.39306640625, 1.5634765625, 1.73388671875, 1.904296875, 2.07470703125, 2.2451171875, 2.41552734375, 2.5859375, 2.75634765625, 2.9267578125, 3.09716796875, 3.267578125, 3.43798828125, 3.6083984375, 3.77880859375, 3.94921875, 4.11962890625, 4.2900390625, 4.46044921875, 4.630859375, 4.80126953125, 4.9716796875, 5.14208984375, 5.3125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 6.0, 8.0, 49.0, 185.0, 381.0, 247.0, 73.0, 26.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.03125, -3.9448089599609375, -3.858367919921875, -3.7719268798828125, -3.68548583984375, -3.5990447998046875, -3.512603759765625, -3.4261627197265625, -3.3397216796875, -3.2532806396484375, -3.166839599609375, -3.0803985595703125, -2.99395751953125, -2.9075164794921875, -2.821075439453125, -2.7346343994140625, -2.648193359375, -2.5617523193359375, -2.475311279296875, -2.3888702392578125, -2.30242919921875, -2.2159881591796875, -2.129547119140625, -2.0431060791015625, -1.9566650390625, -1.8702239990234375, -1.783782958984375, -1.6973419189453125, -1.61090087890625, -1.5244598388671875, -1.438018798828125, -1.3515777587890625, -1.26513671875, -1.1786956787109375, -1.092254638671875, -1.0058135986328125, -0.91937255859375, -0.8329315185546875, -0.746490478515625, -0.6600494384765625, -0.5736083984375, -0.4871673583984375, -0.400726318359375, -0.3142852783203125, -0.22784423828125, -0.1414031982421875, -0.054962158203125, 0.0314788818359375, 0.117919921875, 0.2043609619140625, 0.290802001953125, 0.3772430419921875, 0.46368408203125, 0.5501251220703125, 0.636566162109375, 0.7230072021484375, 0.8094482421875, 0.8958892822265625, 0.982330322265625, 1.0687713623046875, 1.15521240234375, 1.2416534423828125, 1.328094482421875, 1.4145355224609375, 1.5009765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 10.0, 16.0, 72.0, 590.0, 299.0, 18.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.646339416503906, -57.53834533691406, -56.430355072021484, -55.32236099243164, -54.21437072753906, -53.10637664794922, -51.998382568359375, -50.8903923034668, -49.78239822387695, -48.67440414428711, -47.56641387939453, -46.45841979980469, -45.35042953491211, -44.242435455322266, -43.13444519042969, -42.026451110839844, -40.91845703125, -39.810462951660156, -38.70247268676758, -37.594478607177734, -36.486488342285156, -35.37849426269531, -34.27050018310547, -33.16250991821289, -32.05451965332031, -30.9465274810791, -29.83853530883789, -28.730541229248047, -27.622549057006836, -26.514556884765625, -25.406564712524414, -24.298572540283203, -23.190580368041992, -22.08258819580078, -20.97459602355957, -19.86660385131836, -18.758609771728516, -17.650617599487305, -16.542625427246094, -15.434633255004883, -14.326640129089355, -13.218647956848145, -12.110654830932617, -11.002662658691406, -9.894670486450195, -8.786677360534668, -7.678685188293457, -6.570692539215088, -5.462699890136719, -4.35470724105835, -3.2467148303985596, -2.1387224197387695, -1.0307297706604004, 0.07726287841796875, 1.1852550506591797, 2.293247699737549, 3.401240348815918, 4.509232997894287, 5.617225646972656, 6.725217819213867, 7.833210468292236, 8.941203117370605, 10.049195289611816, 11.157188415527344, 12.265180587768555]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 10.0, 9.0, 6.0, 19.0, 17.0, 43.0, 35.0, 59.0, 53.0, 81.0, 72.0, 91.0, 79.0, 73.0, 63.0, 52.0, 61.0, 38.0, 30.0, 28.0, 24.0, 6.0, 11.0, 14.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4281415939331055, -7.18755578994751, -6.946969509124756, -6.70638370513916, -6.465797424316406, -6.2252116203308105, -5.984625816345215, -5.744039535522461, -5.503453731536865, -5.2628679275512695, -5.022281646728516, -4.78169584274292, -4.541110038757324, -4.30052375793457, -4.059937953948975, -3.8193519115448, -3.578765869140625, -3.33817982673645, -3.0975937843322754, -2.8570079803466797, -2.616421937942505, -2.37583589553833, -2.1352500915527344, -1.8946640491485596, -1.6540780067443848, -1.41349196434021, -1.1729060411453247, -0.9323200583457947, -0.6917340755462646, -0.45114803314208984, -0.2105621099472046, 0.030023813247680664, 0.27060937881469727, 0.5111953616142273, 0.7517813444137573, 0.9923673272132874, 1.2329533100128174, 1.4735393524169922, 1.7141252756118774, 1.9547111988067627, 2.1952972412109375, 2.4358832836151123, 2.676469326019287, 2.917055130004883, 3.1576411724090576, 3.3982272148132324, 3.638813018798828, 3.879399061203003, 4.119985103607178, 4.360570907592773, 4.601157188415527, 4.841742992401123, 5.082328796386719, 5.322915077209473, 5.563500881195068, 5.804086685180664, 6.044672966003418, 6.285258769989014, 6.525845050811768, 6.766430854797363, 7.007017135620117, 7.247602939605713, 7.488188743591309, 7.7287750244140625, 7.969360828399658]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 13.0, 11.0, 17.0, 23.0, 24.0, 34.0, 39.0, 55.0, 70.0, 83.0, 107.0, 145.0, 213.0, 348.0, 486.0, 789.0, 1263.0, 2377.0, 4719.0, 12087.0, 51772.0, 3801387.0, 278237.0, 24519.0, 7886.0, 3176.0, 1562.0, 932.0, 562.0, 374.0, 300.0, 191.0, 145.0, 95.0, 55.0, 57.0, 27.0, 30.0, 16.0, 10.0, 9.0, 9.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.44921875, -3.352813720703125, -3.25640869140625, -3.160003662109375, -3.0635986328125, -2.967193603515625, -2.87078857421875, -2.774383544921875, -2.677978515625, -2.581573486328125, -2.48516845703125, -2.388763427734375, -2.2923583984375, -2.195953369140625, -2.09954833984375, -2.003143310546875, -1.90673828125, -1.810333251953125, -1.71392822265625, -1.617523193359375, -1.5211181640625, -1.424713134765625, -1.32830810546875, -1.231903076171875, -1.135498046875, -1.039093017578125, -0.94268798828125, -0.846282958984375, -0.7498779296875, -0.653472900390625, -0.55706787109375, -0.460662841796875, -0.3642578125, -0.267852783203125, -0.17144775390625, -0.075042724609375, 0.0213623046875, 0.117767333984375, 0.21417236328125, 0.310577392578125, 0.406982421875, 0.503387451171875, 0.59979248046875, 0.696197509765625, 0.7926025390625, 0.889007568359375, 0.98541259765625, 1.081817626953125, 1.17822265625, 1.274627685546875, 1.37103271484375, 1.467437744140625, 1.5638427734375, 1.660247802734375, 1.75665283203125, 1.853057861328125, 1.949462890625, 2.045867919921875, 2.14227294921875, 2.238677978515625, 2.3350830078125, 2.431488037109375, 2.52789306640625, 2.624298095703125, 2.720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 11.0, 17.0, 20.0, 14.0, 38.0, 44.0, 79.0, 106.0, 120.0, 114.0, 94.0, 88.0, 55.0, 53.0, 29.0, 23.0, 17.0, 10.0, 5.0, 4.0, 3.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1702880859375, -0.16558456420898438, -0.16088104248046875, -0.15617752075195312, -0.1514739990234375, -0.14677047729492188, -0.14206695556640625, -0.13736343383789062, -0.132659912109375, -0.12795639038085938, -0.12325286865234375, -0.11854934692382812, -0.1138458251953125, -0.10914230346679688, -0.10443878173828125, -0.09973526000976562, -0.09503173828125, -0.09032821655273438, -0.08562469482421875, -0.08092117309570312, -0.0762176513671875, -0.07151412963867188, -0.06681060791015625, -0.062107086181640625, -0.057403564453125, -0.052700042724609375, -0.04799652099609375, -0.043292999267578125, -0.0385894775390625, -0.033885955810546875, -0.02918243408203125, -0.024478912353515625, -0.019775390625, -0.015071868896484375, -0.01036834716796875, -0.005664825439453125, -0.0009613037109375, 0.003742218017578125, 0.00844573974609375, 0.013149261474609375, 0.017852783203125, 0.022556304931640625, 0.02725982666015625, 0.031963348388671875, 0.0366668701171875, 0.041370391845703125, 0.04607391357421875, 0.050777435302734375, 0.05548095703125, 0.060184478759765625, 0.06488800048828125, 0.06959152221679688, 0.0742950439453125, 0.07899856567382812, 0.08370208740234375, 0.08840560913085938, 0.093109130859375, 0.09781265258789062, 0.10251617431640625, 0.10721969604492188, 0.1119232177734375, 0.11662673950195312, 0.12133026123046875, 0.12603378295898438, 0.1307373046875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 6.0, 7.0, 19.0, 31.0, 41.0, 56.0, 134.0, 721.0, 22410.0, 4157879.0, 12233.0, 491.0, 102.0, 46.0, 31.0, 15.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.765625, -11.47467041015625, -11.1837158203125, -10.89276123046875, -10.601806640625, -10.31085205078125, -10.0198974609375, -9.72894287109375, -9.43798828125, -9.14703369140625, -8.8560791015625, -8.56512451171875, -8.274169921875, -7.98321533203125, -7.6922607421875, -7.40130615234375, -7.1103515625, -6.81939697265625, -6.5284423828125, -6.23748779296875, -5.946533203125, -5.65557861328125, -5.3646240234375, -5.07366943359375, -4.78271484375, -4.49176025390625, -4.2008056640625, -3.90985107421875, -3.618896484375, -3.32794189453125, -3.0369873046875, -2.74603271484375, -2.455078125, -2.16412353515625, -1.8731689453125, -1.58221435546875, -1.291259765625, -1.00030517578125, -0.7093505859375, -0.41839599609375, -0.12744140625, 0.16351318359375, 0.4544677734375, 0.74542236328125, 1.036376953125, 1.32733154296875, 1.6182861328125, 1.90924072265625, 2.2001953125, 2.49114990234375, 2.7821044921875, 3.07305908203125, 3.364013671875, 3.65496826171875, 3.9459228515625, 4.23687744140625, 4.52783203125, 4.81878662109375, 5.1097412109375, 5.40069580078125, 5.691650390625, 5.98260498046875, 6.2735595703125, 6.56451416015625, 6.85546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 3.0, 6.0, 9.0, 5.0, 15.0, 12.0, 25.0, 31.0, 44.0, 74.0, 129.0, 245.0, 880.0, 1456.0, 508.0, 227.0, 131.0, 68.0, 59.0, 35.0, 22.0, 17.0, 12.0, 4.0, 9.0, 0.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.277099609375, -0.26849365234375, -0.2598876953125, -0.25128173828125, -0.24267578125, -0.23406982421875, -0.2254638671875, -0.21685791015625, -0.208251953125, -0.19964599609375, -0.1910400390625, -0.18243408203125, -0.173828125, -0.16522216796875, -0.1566162109375, -0.14801025390625, -0.139404296875, -0.13079833984375, -0.1221923828125, -0.11358642578125, -0.10498046875, -0.09637451171875, -0.0877685546875, -0.07916259765625, -0.070556640625, -0.06195068359375, -0.0533447265625, -0.04473876953125, -0.0361328125, -0.02752685546875, -0.0189208984375, -0.01031494140625, -0.001708984375, 0.00689697265625, 0.0155029296875, 0.02410888671875, 0.03271484375, 0.04132080078125, 0.0499267578125, 0.05853271484375, 0.067138671875, 0.07574462890625, 0.0843505859375, 0.09295654296875, 0.1015625, 0.11016845703125, 0.1187744140625, 0.12738037109375, 0.135986328125, 0.14459228515625, 0.1531982421875, 0.16180419921875, 0.17041015625, 0.17901611328125, 0.1876220703125, 0.19622802734375, 0.204833984375, 0.21343994140625, 0.2220458984375, 0.23065185546875, 0.2392578125, 0.24786376953125, 0.2564697265625, 0.26507568359375, 0.273681640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 19.0, 547.0, 434.0, 15.0, 2.0, 4.0], "bins": [-28.242290496826172, -27.77063751220703, -27.298982620239258, -26.827329635620117, -26.355674743652344, -25.884021759033203, -25.412368774414062, -24.94071388244629, -24.46906089782715, -23.997407913208008, -23.525753021240234, -23.054100036621094, -22.58244514465332, -22.11079216003418, -21.63913917541504, -21.167484283447266, -20.695831298828125, -20.224178314208984, -19.75252342224121, -19.28087043762207, -18.809215545654297, -18.337562561035156, -17.865909576416016, -17.394254684448242, -16.9226016998291, -16.45094871520996, -15.979293823242188, -15.507640838623047, -15.03598690032959, -14.564332962036133, -14.092679023742676, -13.621025085449219, -13.149371147155762, -12.677717208862305, -12.206063270568848, -11.734410285949707, -11.26275634765625, -10.791102409362793, -10.319448471069336, -9.847795486450195, -9.376141548156738, -8.904487609863281, -8.432833671569824, -7.961180210113525, -7.489526748657227, -7.0178728103637695, -6.5462188720703125, -6.074565410614014, -5.602911949157715, -5.131258010864258, -4.659604549407959, -4.187950611114502, -3.716297149658203, -3.244643211364746, -2.772989511489868, -2.3013358116149902, -1.8296818733215332, -1.3580281734466553, -0.8863744139671326, -0.41472065448760986, 0.056933045387268066, 0.5285868644714355, 1.0002405643463135, 1.4718942642211914, 1.9435479640960693]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 5.0, 13.0, 16.0, 52.0, 101.0, 164.0, 233.0, 202.0, 109.0, 59.0, 34.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.082638740539551, -4.971395015716553, -4.860151290893555, -4.748907566070557, -4.637663841247559, -4.5264201164245605, -4.4151763916015625, -4.3039326667785645, -4.192688941955566, -4.081445217132568, -3.9702014923095703, -3.8589577674865723, -3.747714042663574, -3.636470317840576, -3.525226593017578, -3.41398286819458, -3.302739143371582, -3.191495418548584, -3.080251693725586, -2.969007968902588, -2.85776424407959, -2.746520519256592, -2.6352767944335938, -2.5240330696105957, -2.4127893447875977, -2.3015456199645996, -2.1903018951416016, -2.0790581703186035, -1.9678144454956055, -1.8565707206726074, -1.7453269958496094, -1.6340832710266113, -1.5228395462036133, -1.4115958213806152, -1.3003520965576172, -1.1891083717346191, -1.077864646911621, -0.966620922088623, -0.855377197265625, -0.744133472442627, -0.6328897476196289, -0.5216460227966309, -0.4104022979736328, -0.29915857315063477, -0.18791484832763672, -0.07667112350463867, 0.034572601318359375, 0.14581632614135742, 0.25706005096435547, 0.3683037757873535, 0.47954750061035156, 0.5907912254333496, 0.7020349502563477, 0.8132786750793457, 0.9245223999023438, 1.0357661247253418, 1.1470098495483398, 1.258253574371338, 1.369497299194336, 1.480741024017334, 1.591984748840332, 1.70322847366333, 1.8144721984863281, 1.9257159233093262, 2.036959648132324]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 10.0, 11.0, 5.0, 13.0, 16.0, 20.0, 17.0, 26.0, 30.0, 36.0, 47.0, 68.0, 116.0, 756.0, 245010.0, 800609.0, 1252.0, 119.0, 72.0, 53.0, 36.0, 43.0, 30.0, 29.0, 23.0, 18.0, 15.0, 17.0, 12.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.5081787109375, -7.258544921875, -7.0089111328125, -6.75927734375, -6.5096435546875, -6.260009765625, -6.0103759765625, -5.7607421875, -5.5111083984375, -5.261474609375, -5.0118408203125, -4.76220703125, -4.5125732421875, -4.262939453125, -4.0133056640625, -3.763671875, -3.5140380859375, -3.264404296875, -3.0147705078125, -2.76513671875, -2.5155029296875, -2.265869140625, -2.0162353515625, -1.7666015625, -1.5169677734375, -1.267333984375, -1.0177001953125, -0.76806640625, -0.5184326171875, -0.268798828125, -0.0191650390625, 0.23046875, 0.4801025390625, 0.729736328125, 0.9793701171875, 1.22900390625, 1.4786376953125, 1.728271484375, 1.9779052734375, 2.2275390625, 2.4771728515625, 2.726806640625, 2.9764404296875, 3.22607421875, 3.4757080078125, 3.725341796875, 3.9749755859375, 4.224609375, 4.4742431640625, 4.723876953125, 4.9735107421875, 5.22314453125, 5.4727783203125, 5.722412109375, 5.9720458984375, 6.2216796875, 6.4713134765625, 6.720947265625, 6.9705810546875, 7.22021484375, 7.4698486328125, 7.719482421875, 7.9691162109375, 8.21875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 53.0, 231.0, 478.0, 196.0, 35.0, 4.0, 6.0, 2.0, 1.0], "bins": [-1.27734375, -1.2550792694091797, -1.2328147888183594, -1.210550308227539, -1.1882858276367188, -1.1660213470458984, -1.1437568664550781, -1.1214923858642578, -1.0992279052734375, -1.0769634246826172, -1.0546989440917969, -1.0324344635009766, -1.0101699829101562, -0.9879055023193359, -0.9656410217285156, -0.9433765411376953, -0.921112060546875, -0.8988475799560547, -0.8765830993652344, -0.8543186187744141, -0.8320541381835938, -0.8097896575927734, -0.7875251770019531, -0.7652606964111328, -0.7429962158203125, -0.7207317352294922, -0.6984672546386719, -0.6762027740478516, -0.6539382934570312, -0.6316738128662109, -0.6094093322753906, -0.5871448516845703, -0.56488037109375, -0.5426158905029297, -0.5203514099121094, -0.49808692932128906, -0.47582244873046875, -0.45355796813964844, -0.4312934875488281, -0.4090290069580078, -0.3867645263671875, -0.3645000457763672, -0.3422355651855469, -0.31997108459472656, -0.29770660400390625, -0.27544212341308594, -0.2531776428222656, -0.2309131622314453, -0.208648681640625, -0.1863842010498047, -0.16411972045898438, -0.14185523986816406, -0.11959075927734375, -0.09732627868652344, -0.07506179809570312, -0.05279731750488281, -0.0305328369140625, -0.008268356323242188, 0.013996124267578125, 0.03626060485839844, 0.05852508544921875, 0.08078956604003906, 0.10305404663085938, 0.1253185272216797, 0.1475830078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 11.0, 18.0, 17.0, 28.0, 28.0, 48.0, 62.0, 93.0, 123.0, 189.0, 275.0, 517.0, 992.0, 1985.0, 4495.0, 12779.0, 40388.0, 147559.0, 431883.0, 290302.0, 79580.0, 23140.0, 7725.0, 3013.0, 1361.0, 704.0, 421.0, 234.0, 149.0, 137.0, 86.0, 50.0, 33.0, 26.0, 20.0, 20.0, 15.0, 7.0, 3.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4794921875, -1.4343414306640625, -1.389190673828125, -1.3440399169921875, -1.29888916015625, -1.2537384033203125, -1.208587646484375, -1.1634368896484375, -1.1182861328125, -1.0731353759765625, -1.027984619140625, -0.9828338623046875, -0.93768310546875, -0.8925323486328125, -0.847381591796875, -0.8022308349609375, -0.757080078125, -0.7119293212890625, -0.666778564453125, -0.6216278076171875, -0.57647705078125, -0.5313262939453125, -0.486175537109375, -0.4410247802734375, -0.3958740234375, -0.3507232666015625, -0.305572509765625, -0.2604217529296875, -0.21527099609375, -0.1701202392578125, -0.124969482421875, -0.0798187255859375, -0.03466796875, 0.0104827880859375, 0.055633544921875, 0.1007843017578125, 0.14593505859375, 0.1910858154296875, 0.236236572265625, 0.2813873291015625, 0.3265380859375, 0.3716888427734375, 0.416839599609375, 0.4619903564453125, 0.50714111328125, 0.5522918701171875, 0.597442626953125, 0.6425933837890625, 0.687744140625, 0.7328948974609375, 0.778045654296875, 0.8231964111328125, 0.86834716796875, 0.9134979248046875, 0.958648681640625, 1.0037994384765625, 1.0489501953125, 1.0941009521484375, 1.139251708984375, 1.1844024658203125, 1.22955322265625, 1.2747039794921875, 1.319854736328125, 1.3650054931640625, 1.41015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 7.0, 9.0, 7.0, 12.0, 16.0, 11.0, 28.0, 22.0, 23.0, 36.0, 37.0, 50.0, 53.0, 42.0, 52.0, 52.0, 63.0, 61.0, 50.0, 40.0, 45.0, 45.0, 32.0, 36.0, 31.0, 22.0, 22.0, 20.0, 14.0, 18.0, 12.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93408203125, -0.9005355834960938, -0.8669891357421875, -0.8334426879882812, -0.799896240234375, -0.7663497924804688, -0.7328033447265625, -0.6992568969726562, -0.66571044921875, -0.6321640014648438, -0.5986175537109375, -0.5650711059570312, -0.531524658203125, -0.49797821044921875, -0.4644317626953125, -0.43088531494140625, -0.3973388671875, -0.36379241943359375, -0.3302459716796875, -0.29669952392578125, -0.263153076171875, -0.22960662841796875, -0.1960601806640625, -0.16251373291015625, -0.12896728515625, -0.09542083740234375, -0.0618743896484375, -0.02832794189453125, 0.005218505859375, 0.03876495361328125, 0.0723114013671875, 0.10585784912109375, 0.139404296875, 0.17295074462890625, 0.2064971923828125, 0.24004364013671875, 0.273590087890625, 0.30713653564453125, 0.3406829833984375, 0.37422943115234375, 0.40777587890625, 0.44132232666015625, 0.4748687744140625, 0.5084152221679688, 0.541961669921875, 0.5755081176757812, 0.6090545654296875, 0.6426010131835938, 0.6761474609375, 0.7096939086914062, 0.7432403564453125, 0.7767868041992188, 0.810333251953125, 0.8438796997070312, 0.8774261474609375, 0.9109725952148438, 0.94451904296875, 0.9780654907226562, 1.0116119384765625, 1.0451583862304688, 1.078704833984375, 1.1122512817382812, 1.1457977294921875, 1.1793441772460938, 1.212890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 5.0, 12.0, 13.0, 14.0, 30.0, 41.0, 43.0, 109.0, 162.0, 331.0, 822.0, 2208.0, 8584.0, 81433.0, 888181.0, 55884.0, 7248.0, 1967.0, 719.0, 317.0, 165.0, 81.0, 49.0, 41.0, 23.0, 9.0, 18.0, 9.0, 3.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.740234375, -3.62127685546875, -3.5023193359375, -3.38336181640625, -3.264404296875, -3.14544677734375, -3.0264892578125, -2.90753173828125, -2.78857421875, -2.66961669921875, -2.5506591796875, -2.43170166015625, -2.312744140625, -2.19378662109375, -2.0748291015625, -1.95587158203125, -1.8369140625, -1.71795654296875, -1.5989990234375, -1.48004150390625, -1.361083984375, -1.24212646484375, -1.1231689453125, -1.00421142578125, -0.88525390625, -0.76629638671875, -0.6473388671875, -0.52838134765625, -0.409423828125, -0.29046630859375, -0.1715087890625, -0.05255126953125, 0.06640625, 0.18536376953125, 0.3043212890625, 0.42327880859375, 0.542236328125, 0.66119384765625, 0.7801513671875, 0.89910888671875, 1.01806640625, 1.13702392578125, 1.2559814453125, 1.37493896484375, 1.493896484375, 1.61285400390625, 1.7318115234375, 1.85076904296875, 1.9697265625, 2.08868408203125, 2.2076416015625, 2.32659912109375, 2.445556640625, 2.56451416015625, 2.6834716796875, 2.80242919921875, 2.92138671875, 3.04034423828125, 3.1593017578125, 3.27825927734375, 3.397216796875, 3.51617431640625, 3.6351318359375, 3.75408935546875, 3.873046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 4.0, 6.0, 6.0, 6.0, 14.0, 9.0, 14.0, 42.0, 62.0, 151.0, 223.0, 202.0, 123.0, 58.0, 31.0, 23.0, 11.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005292892456054688, -0.0005163475871086121, -0.0005034059286117554, -0.0004904642701148987, -0.000477522611618042, -0.0004645809531211853, -0.0004516392946243286, -0.0004386976361274719, -0.00042575597763061523, -0.00041281431913375854, -0.00039987266063690186, -0.00038693100214004517, -0.0003739893436431885, -0.0003610476851463318, -0.0003481060266494751, -0.0003351643681526184, -0.0003222227096557617, -0.00030928105115890503, -0.00029633939266204834, -0.00028339773416519165, -0.00027045607566833496, -0.00025751441717147827, -0.0002445727586746216, -0.0002316311001777649, -0.0002186894416809082, -0.00020574778318405151, -0.00019280612468719482, -0.00017986446619033813, -0.00016692280769348145, -0.00015398114919662476, -0.00014103949069976807, -0.00012809783220291138, -0.00011515617370605469, -0.000102214515209198, -8.927285671234131e-05, -7.633119821548462e-05, -6.338953971862793e-05, -5.044788122177124e-05, -3.750622272491455e-05, -2.456456422805786e-05, -1.1622905731201172e-05, 1.3187527656555176e-06, 1.4260411262512207e-05, 2.7202069759368896e-05, 4.0143728256225586e-05, 5.3085386753082275e-05, 6.602704524993896e-05, 7.896870374679565e-05, 9.191036224365234e-05, 0.00010485202074050903, 0.00011779367923736572, 0.0001307353377342224, 0.0001436769962310791, 0.0001566186547279358, 0.00016956031322479248, 0.00018250197172164917, 0.00019544363021850586, 0.00020838528871536255, 0.00022132694721221924, 0.00023426860570907593, 0.0002472102642059326, 0.0002601519227027893, 0.000273093581199646, 0.0002860352396965027, 0.0002989768981933594]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 9.0, 9.0, 24.0, 41.0, 63.0, 96.0, 229.0, 570.0, 1546.0, 5988.0, 152720.0, 873650.0, 9924.0, 2215.0, 740.0, 374.0, 159.0, 84.0, 49.0, 24.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.453125, -11.167724609375, -10.88232421875, -10.596923828125, -10.3115234375, -10.026123046875, -9.74072265625, -9.455322265625, -9.169921875, -8.884521484375, -8.59912109375, -8.313720703125, -8.0283203125, -7.742919921875, -7.45751953125, -7.172119140625, -6.88671875, -6.601318359375, -6.31591796875, -6.030517578125, -5.7451171875, -5.459716796875, -5.17431640625, -4.888916015625, -4.603515625, -4.318115234375, -4.03271484375, -3.747314453125, -3.4619140625, -3.176513671875, -2.89111328125, -2.605712890625, -2.3203125, -2.034912109375, -1.74951171875, -1.464111328125, -1.1787109375, -0.893310546875, -0.60791015625, -0.322509765625, -0.037109375, 0.248291015625, 0.53369140625, 0.819091796875, 1.1044921875, 1.389892578125, 1.67529296875, 1.960693359375, 2.24609375, 2.531494140625, 2.81689453125, 3.102294921875, 3.3876953125, 3.673095703125, 3.95849609375, 4.243896484375, 4.529296875, 4.814697265625, 5.10009765625, 5.385498046875, 5.6708984375, 5.956298828125, 6.24169921875, 6.527099609375, 6.8125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 1.0, 4.0, 12.0, 5.0, 9.0, 20.0, 42.0, 87.0, 245.0, 286.0, 161.0, 57.0, 20.0, 14.0, 8.0, 7.0, 1.0, 8.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83984375, -1.75701904296875, -1.6741943359375, -1.59136962890625, -1.508544921875, -1.42572021484375, -1.3428955078125, -1.26007080078125, -1.17724609375, -1.09442138671875, -1.0115966796875, -0.92877197265625, -0.845947265625, -0.76312255859375, -0.6802978515625, -0.59747314453125, -0.5146484375, -0.43182373046875, -0.3489990234375, -0.26617431640625, -0.183349609375, -0.10052490234375, -0.0177001953125, 0.06512451171875, 0.14794921875, 0.23077392578125, 0.3135986328125, 0.39642333984375, 0.479248046875, 0.56207275390625, 0.6448974609375, 0.72772216796875, 0.810546875, 0.89337158203125, 0.9761962890625, 1.05902099609375, 1.141845703125, 1.22467041015625, 1.3074951171875, 1.39031982421875, 1.47314453125, 1.55596923828125, 1.6387939453125, 1.72161865234375, 1.804443359375, 1.88726806640625, 1.9700927734375, 2.05291748046875, 2.1357421875, 2.21856689453125, 2.3013916015625, 2.38421630859375, 2.467041015625, 2.54986572265625, 2.6326904296875, 2.71551513671875, 2.79833984375, 2.88116455078125, 2.9639892578125, 3.04681396484375, 3.129638671875, 3.21246337890625, 3.2952880859375, 3.37811279296875, 3.4609375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 85.0, 836.0, 73.0, 12.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-155.31600952148438, -152.4038848876953, -149.49176025390625, -146.57962036132812, -143.66749572753906, -140.75537109375, -137.84324645996094, -134.9311065673828, -132.01898193359375, -129.1068572998047, -126.1947250366211, -123.28260040283203, -120.37046813964844, -117.45834350585938, -114.54621124267578, -111.63408660888672, -108.72195434570312, -105.80982971191406, -102.89769744873047, -99.9855728149414, -97.07344055175781, -94.16131591796875, -91.24918365478516, -88.3370590209961, -85.42493438720703, -82.51280975341797, -79.60067749023438, -76.68855285644531, -73.77642059326172, -70.86429595947266, -67.95216369628906, -65.0400390625, -62.12791442871094, -59.21578598022461, -56.30365753173828, -53.39152908325195, -50.479400634765625, -47.5672721862793, -44.65514373779297, -41.743019104003906, -38.83088684082031, -35.918758392333984, -33.006629943847656, -30.094501495361328, -27.182373046875, -24.270244598388672, -21.358118057250977, -18.44598960876465, -15.53386116027832, -12.621732711791992, -9.709604263305664, -6.797476768493652, -3.885348320007324, -0.9732198715209961, 1.9389076232910156, 4.851036071777344, 7.763164520263672, 10.67529296875, 13.587421417236328, 16.499549865722656, 19.411678314208984, 22.323806762695312, 25.235933303833008, 28.148061752319336, 31.060190200805664]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 11.0, 26.0, 47.0, 69.0, 76.0, 116.0, 112.0, 109.0, 115.0, 94.0, 69.0, 59.0, 33.0, 24.0, 21.0, 12.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.51825714111328, -25.00495719909668, -24.49165916442871, -23.97835922241211, -23.465059280395508, -22.95176124572754, -22.438461303710938, -21.925161361694336, -21.411863327026367, -20.898563385009766, -20.385265350341797, -19.871965408325195, -19.358665466308594, -18.845367431640625, -18.332067489624023, -17.818767547607422, -17.305469512939453, -16.79216957092285, -16.278871536254883, -15.765571594238281, -15.252272605895996, -14.738973617553711, -14.22567367553711, -13.712374687194824, -13.199073791503906, -12.685774803161621, -12.17247486114502, -11.659175872802734, -11.14587688446045, -10.632577896118164, -10.119277954101562, -9.605978965759277, -9.092679977416992, -8.579380989074707, -8.066081047058105, -7.55278205871582, -7.039483070373535, -6.526183605194092, -6.012884140014648, -5.499585151672363, -4.986285209655762, -4.472985744476318, -3.959686756134033, -3.44638729095459, -2.9330880641937256, -2.4197888374328613, -1.906489372253418, -1.3931901454925537, -0.8798909187316895, -0.3665916323661804, 0.1467076539993286, 0.6600069999694824, 1.1733062267303467, 1.686605453491211, 2.1999049186706543, 2.7132041454315186, 3.226503372192383, 3.739802598953247, 4.253101825714111, 4.766401290893555, 5.27970027923584, 5.792999744415283, 6.306299209594727, 6.819598197937012, 7.332897663116455]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 11.0, 12.0, 19.0, 43.0, 62.0, 104.0, 172.0, 456.0, 46070.0, 4146892.0, 333.0, 86.0, 25.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.875, -61.713134765625, -60.55126953125, -59.389404296875, -58.2275390625, -57.065673828125, -55.90380859375, -54.741943359375, -53.580078125, -52.418212890625, -51.25634765625, -50.094482421875, -48.9326171875, -47.770751953125, -46.60888671875, -45.447021484375, -44.28515625, -43.123291015625, -41.96142578125, -40.799560546875, -39.6376953125, -38.475830078125, -37.31396484375, -36.152099609375, -34.990234375, -33.828369140625, -32.66650390625, -31.504638671875, -30.3427734375, -29.180908203125, -28.01904296875, -26.857177734375, -25.6953125, -24.533447265625, -23.37158203125, -22.209716796875, -21.0478515625, -19.885986328125, -18.72412109375, -17.562255859375, -16.400390625, -15.238525390625, -14.07666015625, -12.914794921875, -11.7529296875, -10.591064453125, -9.42919921875, -8.267333984375, -7.10546875, -5.943603515625, -4.78173828125, -3.619873046875, -2.4580078125, -1.296142578125, -0.13427734375, 1.027587890625, 2.189453125, 3.351318359375, 4.51318359375, 5.675048828125, 6.8369140625, 7.998779296875, 9.16064453125, 10.322509765625, 11.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 23.0, 106.0, 253.0, 330.0, 177.0, 87.0, 21.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4853515625, -1.4580039978027344, -1.4306564331054688, -1.4033088684082031, -1.3759613037109375, -1.3486137390136719, -1.3212661743164062, -1.2939186096191406, -1.266571044921875, -1.2392234802246094, -1.2118759155273438, -1.1845283508300781, -1.1571807861328125, -1.1298332214355469, -1.1024856567382812, -1.0751380920410156, -1.04779052734375, -1.0204429626464844, -0.9930953979492188, -0.9657478332519531, -0.9384002685546875, -0.9110527038574219, -0.8837051391601562, -0.8563575744628906, -0.829010009765625, -0.8016624450683594, -0.7743148803710938, -0.7469673156738281, -0.7196197509765625, -0.6922721862792969, -0.6649246215820312, -0.6375770568847656, -0.6102294921875, -0.5828819274902344, -0.5555343627929688, -0.5281867980957031, -0.5008392333984375, -0.4734916687011719, -0.44614410400390625, -0.4187965393066406, -0.391448974609375, -0.3641014099121094, -0.33675384521484375, -0.3094062805175781, -0.2820587158203125, -0.2547111511230469, -0.22736358642578125, -0.20001602172851562, -0.17266845703125, -0.14532089233398438, -0.11797332763671875, -0.09062576293945312, -0.0632781982421875, -0.035930633544921875, -0.00858306884765625, 0.018764495849609375, 0.046112060546875, 0.07345962524414062, 0.10080718994140625, 0.12815475463867188, 0.1555023193359375, 0.18284988403320312, 0.21019744873046875, 0.23754501342773438, 0.264892578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 9.0, 23.0, 37.0, 90.0, 151.0, 344.0, 8762.0, 4183929.0, 646.0, 162.0, 73.0, 34.0, 13.0, 8.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.2158203125, -38.681640625, -37.1474609375, -35.61328125, -34.0791015625, -32.544921875, -31.0107421875, -29.4765625, -27.9423828125, -26.408203125, -24.8740234375, -23.33984375, -21.8056640625, -20.271484375, -18.7373046875, -17.203125, -15.6689453125, -14.134765625, -12.6005859375, -11.06640625, -9.5322265625, -7.998046875, -6.4638671875, -4.9296875, -3.3955078125, -1.861328125, -0.3271484375, 1.20703125, 2.7412109375, 4.275390625, 5.8095703125, 7.34375, 8.8779296875, 10.412109375, 11.9462890625, 13.48046875, 15.0146484375, 16.548828125, 18.0830078125, 19.6171875, 21.1513671875, 22.685546875, 24.2197265625, 25.75390625, 27.2880859375, 28.822265625, 30.3564453125, 31.890625, 33.4248046875, 34.958984375, 36.4931640625, 38.02734375, 39.5615234375, 41.095703125, 42.6298828125, 44.1640625, 45.6982421875, 47.232421875, 48.7666015625, 50.30078125, 51.8349609375, 53.369140625, 54.9033203125, 56.4375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 10.0, 34.0, 333.0, 3464.0, 193.0, 35.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.125, -6.012298583984375, -5.89959716796875, -5.786895751953125, -5.6741943359375, -5.561492919921875, -5.44879150390625, -5.336090087890625, -5.223388671875, -5.110687255859375, -4.99798583984375, -4.885284423828125, -4.7725830078125, -4.659881591796875, -4.54718017578125, -4.434478759765625, -4.32177734375, -4.209075927734375, -4.09637451171875, -3.983673095703125, -3.8709716796875, -3.758270263671875, -3.64556884765625, -3.532867431640625, -3.420166015625, -3.307464599609375, -3.19476318359375, -3.082061767578125, -2.9693603515625, -2.856658935546875, -2.74395751953125, -2.631256103515625, -2.5185546875, -2.405853271484375, -2.29315185546875, -2.180450439453125, -2.0677490234375, -1.955047607421875, -1.84234619140625, -1.729644775390625, -1.616943359375, -1.504241943359375, -1.39154052734375, -1.278839111328125, -1.1661376953125, -1.053436279296875, -0.94073486328125, -0.828033447265625, -0.71533203125, -0.602630615234375, -0.48992919921875, -0.377227783203125, -0.2645263671875, -0.151824951171875, -0.03912353515625, 0.073577880859375, 0.186279296875, 0.298980712890625, 0.41168212890625, 0.524383544921875, 0.6370849609375, 0.749786376953125, 0.86248779296875, 0.975189208984375, 1.087890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 11.0, 40.0, 411.0, 465.0, 60.0, 13.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.2281379699707, -47.28314971923828, -46.33816146850586, -45.39317321777344, -44.448184967041016, -43.503196716308594, -42.55820846557617, -41.61322021484375, -40.668235778808594, -39.72324752807617, -38.77825927734375, -37.83327102661133, -36.888282775878906, -35.943294525146484, -34.99830627441406, -34.053321838378906, -33.10832977294922, -32.1633415222168, -31.218353271484375, -30.273365020751953, -29.32837677001953, -28.38338851928711, -27.43840217590332, -26.4934139251709, -25.548425674438477, -24.603437423706055, -23.658449172973633, -22.71346092224121, -21.768474578857422, -20.823486328125, -19.878498077392578, -18.933509826660156, -17.988521575927734, -17.043533325195312, -16.09854507446289, -15.153557777404785, -14.208569526672363, -13.263581275939941, -12.318593978881836, -11.373605728149414, -10.428617477416992, -9.48362922668457, -8.538640975952148, -7.593653678894043, -6.648665428161621, -5.703677177429199, -4.7586894035339355, -3.813701629638672, -2.86871337890625, -1.9237253665924072, -0.9787373542785645, -0.03374934196472168, 0.9112386703491211, 1.856226921081543, 2.8012146949768066, 3.7462024688720703, 4.691190719604492, 5.636178970336914, 6.581166744232178, 7.526154518127441, 8.471142768859863, 9.416131019592285, 10.36111831665039, 11.306106567382812, 12.251094818115234]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 10.0, 9.0, 30.0, 39.0, 55.0, 103.0, 100.0, 143.0, 143.0, 124.0, 85.0, 70.0, 45.0, 22.0, 18.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.258219718933105, -14.819241523742676, -14.380263328552246, -13.941285133361816, -13.502307891845703, -13.063329696655273, -12.624351501464844, -12.185373306274414, -11.746395111083984, -11.307416915893555, -10.868438720703125, -10.429460525512695, -9.990482330322266, -9.551504135131836, -9.112526893615723, -8.673548698425293, -8.234570503234863, -7.795592308044434, -7.356614112854004, -6.917636394500732, -6.478658199310303, -6.039680004119873, -5.600702285766602, -5.161724090576172, -4.722745895385742, -4.2837677001953125, -3.844789743423462, -3.4058117866516113, -2.9668335914611816, -2.527855396270752, -2.0888774394989014, -1.6498994827270508, -1.2109203338623047, -0.7719422578811646, -0.3329641819000244, 0.10601389408111572, 0.5449919700622559, 0.9839701652526855, 1.4229481220245361, 1.8619260787963867, 2.3009042739868164, 2.739882469177246, 3.1788604259490967, 3.6178383827209473, 4.056816577911377, 4.495794773101807, 4.934772491455078, 5.373750686645508, 5.8127288818359375, 6.251707077026367, 6.690685272216797, 7.129662990570068, 7.568641185760498, 8.007619857788086, 8.4465970993042, 8.885575294494629, 9.324553489685059, 9.763531684875488, 10.202509880065918, 10.641488075256348, 11.080465316772461, 11.51944351196289, 11.95842170715332, 12.39739990234375, 12.83637809753418]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 23.0, 18.0, 25.0, 31.0, 32.0, 67.0, 104.0, 202.0, 768.0, 5290.0, 208218.0, 818575.0, 13110.0, 1376.0, 312.0, 121.0, 70.0, 40.0, 34.0, 25.0, 21.0, 14.0, 14.0, 11.0, 10.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9765625, -9.6458740234375, -9.315185546875, -8.9844970703125, -8.65380859375, -8.3231201171875, -7.992431640625, -7.6617431640625, -7.3310546875, -7.0003662109375, -6.669677734375, -6.3389892578125, -6.00830078125, -5.6776123046875, -5.346923828125, -5.0162353515625, -4.685546875, -4.3548583984375, -4.024169921875, -3.6934814453125, -3.36279296875, -3.0321044921875, -2.701416015625, -2.3707275390625, -2.0400390625, -1.7093505859375, -1.378662109375, -1.0479736328125, -0.71728515625, -0.3865966796875, -0.055908203125, 0.2747802734375, 0.60546875, 0.9361572265625, 1.266845703125, 1.5975341796875, 1.92822265625, 2.2589111328125, 2.589599609375, 2.9202880859375, 3.2509765625, 3.5816650390625, 3.912353515625, 4.2430419921875, 4.57373046875, 4.9044189453125, 5.235107421875, 5.5657958984375, 5.896484375, 6.2271728515625, 6.557861328125, 6.8885498046875, 7.21923828125, 7.5499267578125, 7.880615234375, 8.2113037109375, 8.5419921875, 8.8726806640625, 9.203369140625, 9.5340576171875, 9.86474609375, 10.1954345703125, 10.526123046875, 10.8568115234375, 11.1875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 12.0, 24.0, 80.0, 129.0, 186.0, 213.0, 170.0, 103.0, 55.0, 17.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765625, -1.7297210693359375, -1.693817138671875, -1.6579132080078125, -1.62200927734375, -1.5861053466796875, -1.550201416015625, -1.5142974853515625, -1.4783935546875, -1.4424896240234375, -1.406585693359375, -1.3706817626953125, -1.33477783203125, -1.2988739013671875, -1.262969970703125, -1.2270660400390625, -1.191162109375, -1.1552581787109375, -1.119354248046875, -1.0834503173828125, -1.04754638671875, -1.0116424560546875, -0.975738525390625, -0.9398345947265625, -0.9039306640625, -0.8680267333984375, -0.832122802734375, -0.7962188720703125, -0.76031494140625, -0.7244110107421875, -0.688507080078125, -0.6526031494140625, -0.61669921875, -0.5807952880859375, -0.544891357421875, -0.5089874267578125, -0.47308349609375, -0.4371795654296875, -0.401275634765625, -0.3653717041015625, -0.3294677734375, -0.2935638427734375, -0.257659912109375, -0.2217559814453125, -0.18585205078125, -0.1499481201171875, -0.114044189453125, -0.0781402587890625, -0.042236328125, -0.0063323974609375, 0.029571533203125, 0.0654754638671875, 0.10137939453125, 0.1372833251953125, 0.173187255859375, 0.2090911865234375, 0.2449951171875, 0.2808990478515625, 0.316802978515625, 0.3527069091796875, 0.38861083984375, 0.4245147705078125, 0.460418701171875, 0.4963226318359375, 0.5322265625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 12.0, 9.0, 18.0, 26.0, 32.0, 55.0, 66.0, 95.0, 173.0, 292.0, 515.0, 1134.0, 3181.0, 14872.0, 129260.0, 719751.0, 156305.0, 16786.0, 3510.0, 1164.0, 526.0, 273.0, 165.0, 118.0, 65.0, 43.0, 29.0, 23.0, 13.0, 8.0, 9.0, 6.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.775390625, -3.66607666015625, -3.5567626953125, -3.44744873046875, -3.338134765625, -3.22882080078125, -3.1195068359375, -3.01019287109375, -2.90087890625, -2.79156494140625, -2.6822509765625, -2.57293701171875, -2.463623046875, -2.35430908203125, -2.2449951171875, -2.13568115234375, -2.0263671875, -1.91705322265625, -1.8077392578125, -1.69842529296875, -1.589111328125, -1.47979736328125, -1.3704833984375, -1.26116943359375, -1.15185546875, -1.04254150390625, -0.9332275390625, -0.82391357421875, -0.714599609375, -0.60528564453125, -0.4959716796875, -0.38665771484375, -0.27734375, -0.16802978515625, -0.0587158203125, 0.05059814453125, 0.159912109375, 0.26922607421875, 0.3785400390625, 0.48785400390625, 0.59716796875, 0.70648193359375, 0.8157958984375, 0.92510986328125, 1.034423828125, 1.14373779296875, 1.2530517578125, 1.36236572265625, 1.4716796875, 1.58099365234375, 1.6903076171875, 1.79962158203125, 1.908935546875, 2.01824951171875, 2.1275634765625, 2.23687744140625, 2.34619140625, 2.45550537109375, 2.5648193359375, 2.67413330078125, 2.783447265625, 2.89276123046875, 3.0020751953125, 3.11138916015625, 3.220703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 3.0, 10.0, 8.0, 6.0, 12.0, 16.0, 16.0, 25.0, 29.0, 31.0, 39.0, 37.0, 51.0, 55.0, 64.0, 61.0, 70.0, 63.0, 67.0, 42.0, 43.0, 44.0, 40.0, 29.0, 28.0, 20.0, 27.0, 13.0, 10.0, 7.0, 11.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8857421875, -1.8341064453125, -1.782470703125, -1.7308349609375, -1.67919921875, -1.6275634765625, -1.575927734375, -1.5242919921875, -1.47265625, -1.4210205078125, -1.369384765625, -1.3177490234375, -1.26611328125, -1.2144775390625, -1.162841796875, -1.1112060546875, -1.0595703125, -1.0079345703125, -0.956298828125, -0.9046630859375, -0.85302734375, -0.8013916015625, -0.749755859375, -0.6981201171875, -0.646484375, -0.5948486328125, -0.543212890625, -0.4915771484375, -0.43994140625, -0.3883056640625, -0.336669921875, -0.2850341796875, -0.2333984375, -0.1817626953125, -0.130126953125, -0.0784912109375, -0.02685546875, 0.0247802734375, 0.076416015625, 0.1280517578125, 0.1796875, 0.2313232421875, 0.282958984375, 0.3345947265625, 0.38623046875, 0.4378662109375, 0.489501953125, 0.5411376953125, 0.5927734375, 0.6444091796875, 0.696044921875, 0.7476806640625, 0.79931640625, 0.8509521484375, 0.902587890625, 0.9542236328125, 1.005859375, 1.0574951171875, 1.109130859375, 1.1607666015625, 1.21240234375, 1.2640380859375, 1.315673828125, 1.3673095703125, 1.4189453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 7.0, 17.0, 34.0, 40.0, 65.0, 166.0, 466.0, 2426.0, 63968.0, 967812.0, 11883.0, 1100.0, 290.0, 140.0, 57.0, 34.0, 19.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -5.95379638671875, -5.7357177734375, -5.51763916015625, -5.299560546875, -5.08148193359375, -4.8634033203125, -4.64532470703125, -4.42724609375, -4.20916748046875, -3.9910888671875, -3.77301025390625, -3.554931640625, -3.33685302734375, -3.1187744140625, -2.90069580078125, -2.6826171875, -2.46453857421875, -2.2464599609375, -2.02838134765625, -1.810302734375, -1.59222412109375, -1.3741455078125, -1.15606689453125, -0.93798828125, -0.71990966796875, -0.5018310546875, -0.28375244140625, -0.065673828125, 0.15240478515625, 0.3704833984375, 0.58856201171875, 0.806640625, 1.02471923828125, 1.2427978515625, 1.46087646484375, 1.678955078125, 1.89703369140625, 2.1151123046875, 2.33319091796875, 2.55126953125, 2.76934814453125, 2.9874267578125, 3.20550537109375, 3.423583984375, 3.64166259765625, 3.8597412109375, 4.07781982421875, 4.2958984375, 4.51397705078125, 4.7320556640625, 4.95013427734375, 5.168212890625, 5.38629150390625, 5.6043701171875, 5.82244873046875, 6.04052734375, 6.25860595703125, 6.4766845703125, 6.69476318359375, 6.912841796875, 7.13092041015625, 7.3489990234375, 7.56707763671875, 7.78515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 16.0, 25.0, 58.0, 82.0, 159.0, 150.0, 185.0, 115.0, 70.0, 36.0, 22.0, 18.0, 11.0, 10.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034737586975097656, -0.0003344342112541199, -0.0003214925527572632, -0.0003085508942604065, -0.0002956092357635498, -0.0002826675772666931, -0.0002697259187698364, -0.00025678426027297974, -0.00024384260177612305, -0.00023090094327926636, -0.00021795928478240967, -0.00020501762628555298, -0.0001920759677886963, -0.0001791343092918396, -0.0001661926507949829, -0.00015325099229812622, -0.00014030933380126953, -0.00012736767530441284, -0.00011442601680755615, -0.00010148435831069946, -8.854269981384277e-05, -7.560104131698608e-05, -6.26593828201294e-05, -4.9717724323272705e-05, -3.6776065826416016e-05, -2.3834407329559326e-05, -1.0892748832702637e-05, 2.0489096641540527e-06, 1.4990568161010742e-05, 2.793222665786743e-05, 4.087388515472412e-05, 5.381554365158081e-05, 6.67572021484375e-05, 7.969886064529419e-05, 9.264051914215088e-05, 0.00010558217763900757, 0.00011852383613586426, 0.00013146549463272095, 0.00014440715312957764, 0.00015734881162643433, 0.00017029047012329102, 0.0001832321286201477, 0.0001961737871170044, 0.00020911544561386108, 0.00022205710411071777, 0.00023499876260757446, 0.00024794042110443115, 0.00026088207960128784, 0.00027382373809814453, 0.0002867653965950012, 0.0002997070550918579, 0.0003126487135887146, 0.0003255903720855713, 0.000338532030582428, 0.00035147368907928467, 0.00036441534757614136, 0.00037735700607299805, 0.00039029866456985474, 0.0004032403230667114, 0.0004161819815635681, 0.0004291236400604248, 0.0004420652985572815, 0.0004550069570541382, 0.0004679486155509949, 0.00048089027404785156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 6.0, 10.0, 13.0, 12.0, 18.0, 37.0, 75.0, 112.0, 233.0, 586.0, 1652.0, 6135.0, 47723.0, 891242.0, 89081.0, 8425.0, 2003.0, 630.0, 248.0, 122.0, 65.0, 45.0, 19.0, 15.0, 10.0, 10.0, 6.0, 8.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.87109375, -4.74151611328125, -4.6119384765625, -4.48236083984375, -4.352783203125, -4.22320556640625, -4.0936279296875, -3.96405029296875, -3.83447265625, -3.70489501953125, -3.5753173828125, -3.44573974609375, -3.316162109375, -3.18658447265625, -3.0570068359375, -2.92742919921875, -2.7978515625, -2.66827392578125, -2.5386962890625, -2.40911865234375, -2.279541015625, -2.14996337890625, -2.0203857421875, -1.89080810546875, -1.76123046875, -1.63165283203125, -1.5020751953125, -1.37249755859375, -1.242919921875, -1.11334228515625, -0.9837646484375, -0.85418701171875, -0.724609375, -0.59503173828125, -0.4654541015625, -0.33587646484375, -0.206298828125, -0.07672119140625, 0.0528564453125, 0.18243408203125, 0.31201171875, 0.44158935546875, 0.5711669921875, 0.70074462890625, 0.830322265625, 0.95989990234375, 1.0894775390625, 1.21905517578125, 1.3486328125, 1.47821044921875, 1.6077880859375, 1.73736572265625, 1.866943359375, 1.99652099609375, 2.1260986328125, 2.25567626953125, 2.38525390625, 2.51483154296875, 2.6444091796875, 2.77398681640625, 2.903564453125, 3.03314208984375, 3.1627197265625, 3.29229736328125, 3.421875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 7.0, 9.0, 16.0, 26.0, 47.0, 95.0, 130.0, 193.0, 173.0, 114.0, 68.0, 35.0, 26.0, 19.0, 12.0, 6.0, 5.0, 6.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.58203125, -2.5256805419921875, -2.469329833984375, -2.4129791259765625, -2.35662841796875, -2.3002777099609375, -2.243927001953125, -2.1875762939453125, -2.1312255859375, -2.0748748779296875, -2.018524169921875, -1.9621734619140625, -1.90582275390625, -1.8494720458984375, -1.793121337890625, -1.7367706298828125, -1.680419921875, -1.6240692138671875, -1.567718505859375, -1.5113677978515625, -1.45501708984375, -1.3986663818359375, -1.342315673828125, -1.2859649658203125, -1.2296142578125, -1.1732635498046875, -1.116912841796875, -1.0605621337890625, -1.00421142578125, -0.9478607177734375, -0.891510009765625, -0.8351593017578125, -0.77880859375, -0.7224578857421875, -0.666107177734375, -0.6097564697265625, -0.55340576171875, -0.4970550537109375, -0.440704345703125, -0.3843536376953125, -0.3280029296875, -0.2716522216796875, -0.215301513671875, -0.1589508056640625, -0.10260009765625, -0.0462493896484375, 0.010101318359375, 0.0664520263671875, 0.122802734375, 0.1791534423828125, 0.235504150390625, 0.2918548583984375, 0.34820556640625, 0.4045562744140625, 0.460906982421875, 0.5172576904296875, 0.5736083984375, 0.6299591064453125, 0.686309814453125, 0.7426605224609375, 0.79901123046875, 0.8553619384765625, 0.911712646484375, 0.9680633544921875, 1.0244140625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 17.0, 124.0, 517.0, 292.0, 45.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78473663330078, -39.19800567626953, -37.611270904541016, -36.024539947509766, -34.43780517578125, -32.85107421875, -31.264341354370117, -29.677608489990234, -28.09087562561035, -26.50414276123047, -24.917409896850586, -23.330677032470703, -21.743946075439453, -20.157211303710938, -18.570480346679688, -16.983747482299805, -15.397014617919922, -13.810281753540039, -12.223548889160156, -10.63681697845459, -9.050084114074707, -7.463351249694824, -5.876619338989258, -4.289886474609375, -2.703153610229492, -1.1164209842681885, 0.47031164169311523, 2.05704402923584, 3.6437768936157227, 5.2305097579956055, 6.817241668701172, 8.403974533081055, 9.990707397460938, 11.57744026184082, 13.164173126220703, 14.75090503692627, 16.33763885498047, 17.92436981201172, 19.5111026763916, 21.097835540771484, 22.684568405151367, 24.27130126953125, 25.858034133911133, 27.444766998291016, 29.031497955322266, 30.61823272705078, 32.20496368408203, 33.79169464111328, 35.3784294128418, 36.96516036987305, 38.55189514160156, 40.13862609863281, 41.72536087036133, 43.31209182739258, 44.898826599121094, 46.485557556152344, 48.072288513183594, 49.659019470214844, 51.24575424194336, 52.83248519897461, 54.419219970703125, 56.005950927734375, 57.592681884765625, 59.17941665649414, 60.766151428222656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 10.0, 17.0, 13.0, 24.0, 36.0, 20.0, 44.0, 44.0, 46.0, 43.0, 54.0, 57.0, 68.0, 46.0, 57.0, 59.0, 53.0, 55.0, 46.0, 43.0, 38.0, 29.0, 25.0, 12.0, 15.0, 14.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.869195938110352, -10.525186538696289, -10.18117618560791, -9.837166786193848, -9.493157386779785, -9.149147033691406, -8.805137634277344, -8.461128234863281, -8.117118835449219, -7.773108959197998, -7.4290995597839355, -7.085089683532715, -6.741080284118652, -6.397070407867432, -6.053060531616211, -5.709051132202148, -5.3650407791137695, -5.021030902862549, -4.677021503448486, -4.333011627197266, -3.989001989364624, -3.6449923515319824, -3.3009824752807617, -2.95697283744812, -2.6129631996154785, -2.268953561782837, -1.9249438047409058, -1.5809340476989746, -1.236924409866333, -0.8929147720336914, -0.5489048957824707, -0.2048952579498291, 0.1391143798828125, 0.4831240773200989, 0.8271337747573853, 1.1711435317993164, 1.515153169631958, 1.8591628074645996, 2.2031726837158203, 2.547182321548462, 2.8911919593811035, 3.235201597213745, 3.5792112350463867, 3.9232211112976074, 4.267230987548828, 4.611240386962891, 4.955250263214111, 5.299260139465332, 5.6432695388793945, 5.987279415130615, 6.331288814544678, 6.675298690795898, 7.019308090209961, 7.363317966461182, 7.707327842712402, 8.051337242126465, 8.395347595214844, 8.739356994628906, 9.083367347717285, 9.427376747131348, 9.77138614654541, 10.115396499633789, 10.459405899047852, 10.803415298461914, 11.147424697875977]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 2.0, 2.0, 7.0, 3.0, 7.0, 15.0, 5.0, 17.0, 21.0, 13.0, 20.0, 12.0, 30.0, 39.0, 32.0, 38.0, 46.0, 67.0, 95.0, 181.0, 425.0, 1324.0, 5536.0, 51309.0, 3996843.0, 126989.0, 9217.0, 1495.0, 314.0, 99.0, 37.0, 14.0, 7.0, 6.0, 8.0, 2.0, 1.0, 1.0], "bins": [-14.296875, -14.014495849609375, -13.73211669921875, -13.449737548828125, -13.1673583984375, -12.884979248046875, -12.60260009765625, -12.320220947265625, -12.037841796875, -11.755462646484375, -11.47308349609375, -11.190704345703125, -10.9083251953125, -10.625946044921875, -10.34356689453125, -10.061187744140625, -9.77880859375, -9.496429443359375, -9.21405029296875, -8.931671142578125, -8.6492919921875, -8.366912841796875, -8.08453369140625, -7.802154541015625, -7.519775390625, -7.237396240234375, -6.95501708984375, -6.672637939453125, -6.3902587890625, -6.107879638671875, -5.82550048828125, -5.543121337890625, -5.2607421875, -4.978363037109375, -4.69598388671875, -4.413604736328125, -4.1312255859375, -3.848846435546875, -3.56646728515625, -3.284088134765625, -3.001708984375, -2.719329833984375, -2.43695068359375, -2.154571533203125, -1.8721923828125, -1.589813232421875, -1.30743408203125, -1.025054931640625, -0.74267578125, -0.460296630859375, -0.17791748046875, 0.104461669921875, 0.3868408203125, 0.669219970703125, 0.95159912109375, 1.233978271484375, 1.516357421875, 1.798736572265625, 2.08111572265625, 2.363494873046875, 2.6458740234375, 2.928253173828125, 3.21063232421875, 3.493011474609375, 3.775390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 12.0, 18.0, 46.0, 81.0, 117.0, 169.0, 176.0, 157.0, 103.0, 71.0, 25.0, 21.0, 10.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.712890625, -1.6801109313964844, -1.6473312377929688, -1.6145515441894531, -1.5817718505859375, -1.5489921569824219, -1.5162124633789062, -1.4834327697753906, -1.450653076171875, -1.4178733825683594, -1.3850936889648438, -1.3523139953613281, -1.3195343017578125, -1.2867546081542969, -1.2539749145507812, -1.2211952209472656, -1.18841552734375, -1.1556358337402344, -1.1228561401367188, -1.0900764465332031, -1.0572967529296875, -1.0245170593261719, -0.9917373657226562, -0.9589576721191406, -0.926177978515625, -0.8933982849121094, -0.8606185913085938, -0.8278388977050781, -0.7950592041015625, -0.7622795104980469, -0.7294998168945312, -0.6967201232910156, -0.6639404296875, -0.6311607360839844, -0.5983810424804688, -0.5656013488769531, -0.5328216552734375, -0.5000419616699219, -0.46726226806640625, -0.4344825744628906, -0.401702880859375, -0.3689231872558594, -0.33614349365234375, -0.3033638000488281, -0.2705841064453125, -0.23780441284179688, -0.20502471923828125, -0.17224502563476562, -0.13946533203125, -0.10668563842773438, -0.07390594482421875, -0.041126251220703125, -0.0083465576171875, 0.024433135986328125, 0.05721282958984375, 0.08999252319335938, 0.122772216796875, 0.15555191040039062, 0.18833160400390625, 0.22111129760742188, 0.2538909912109375, 0.2866706848144531, 0.31945037841796875, 0.3522300720214844, 0.385009765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 12.0, 25.0, 45.0, 191.0, 596.0, 3472.0, 3840929.0, 346626.0, 1897.0, 322.0, 93.0, 33.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.875, -27.26806640625, -26.6611328125, -26.05419921875, -25.447265625, -24.84033203125, -24.2333984375, -23.62646484375, -23.01953125, -22.41259765625, -21.8056640625, -21.19873046875, -20.591796875, -19.98486328125, -19.3779296875, -18.77099609375, -18.1640625, -17.55712890625, -16.9501953125, -16.34326171875, -15.736328125, -15.12939453125, -14.5224609375, -13.91552734375, -13.30859375, -12.70166015625, -12.0947265625, -11.48779296875, -10.880859375, -10.27392578125, -9.6669921875, -9.06005859375, -8.453125, -7.84619140625, -7.2392578125, -6.63232421875, -6.025390625, -5.41845703125, -4.8115234375, -4.20458984375, -3.59765625, -2.99072265625, -2.3837890625, -1.77685546875, -1.169921875, -0.56298828125, 0.0439453125, 0.65087890625, 1.2578125, 1.86474609375, 2.4716796875, 3.07861328125, 3.685546875, 4.29248046875, 4.8994140625, 5.50634765625, 6.11328125, 6.72021484375, 7.3271484375, 7.93408203125, 8.541015625, 9.14794921875, 9.7548828125, 10.36181640625, 10.96875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 18.0, 28.0, 34.0, 96.0, 271.0, 1788.0, 1441.0, 232.0, 86.0, 27.0, 16.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.55859375, -2.5063552856445312, -2.4541168212890625, -2.4018783569335938, -2.349639892578125, -2.2974014282226562, -2.2451629638671875, -2.1929244995117188, -2.14068603515625, -2.0884475708007812, -2.0362091064453125, -1.9839706420898438, -1.931732177734375, -1.8794937133789062, -1.8272552490234375, -1.7750167846679688, -1.7227783203125, -1.6705398559570312, -1.6183013916015625, -1.5660629272460938, -1.513824462890625, -1.4615859985351562, -1.4093475341796875, -1.3571090698242188, -1.30487060546875, -1.2526321411132812, -1.2003936767578125, -1.1481552124023438, -1.095916748046875, -1.0436782836914062, -0.9914398193359375, -0.9392013549804688, -0.886962890625, -0.8347244262695312, -0.7824859619140625, -0.7302474975585938, -0.678009033203125, -0.6257705688476562, -0.5735321044921875, -0.5212936401367188, -0.46905517578125, -0.41681671142578125, -0.3645782470703125, -0.31233978271484375, -0.260101318359375, -0.20786285400390625, -0.1556243896484375, -0.10338592529296875, -0.0511474609375, 0.00109100341796875, 0.0533294677734375, 0.10556793212890625, 0.157806396484375, 0.21004486083984375, 0.2622833251953125, 0.31452178955078125, 0.36676025390625, 0.41899871826171875, 0.4712371826171875, 0.5234756469726562, 0.575714111328125, 0.6279525756835938, 0.6801910400390625, 0.7324295043945312, 0.78466796875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 27.0, 100.0, 369.0, 388.0, 89.0, 12.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.176610946655273, -19.61725616455078, -19.057903289794922, -18.49854850769043, -17.93919563293457, -17.379840850830078, -16.82048797607422, -16.261133193969727, -15.701780319213867, -15.142426490783691, -14.583072662353516, -14.02371883392334, -13.464365005493164, -12.905011177062988, -12.345657348632812, -11.78630256652832, -11.226948738098145, -10.667594909667969, -10.108241081237793, -9.548887252807617, -8.989533424377441, -8.430179595947266, -7.870825290679932, -7.311471462249756, -6.75211763381958, -6.192763805389404, -5.6334099769592285, -5.0740556716918945, -4.514701843261719, -3.955348253250122, -3.395994186401367, -2.8366403579711914, -2.2772865295410156, -1.7179327011108398, -1.1585787534713745, -0.5992248058319092, -0.0398709774017334, 0.5194828510284424, 1.0788369178771973, 1.638190746307373, 2.197544574737549, 2.7568984031677246, 3.3162522315979004, 3.8756062984466553, 4.43496036529541, 4.994314193725586, 5.553668022155762, 6.1130218505859375, 6.672375679016113, 7.231729507446289, 7.791083335876465, 8.35043716430664, 8.909790992736816, 9.469144821166992, 10.028499603271484, 10.587852478027344, 11.147207260131836, 11.706561088562012, 12.265914916992188, 12.825268745422363, 13.384622573852539, 13.943976402282715, 14.50333023071289, 15.062685012817383, 15.622037887573242]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 15.0, 14.0, 10.0, 21.0, 25.0, 46.0, 54.0, 68.0, 71.0, 74.0, 73.0, 84.0, 78.0, 79.0, 80.0, 52.0, 46.0, 30.0, 27.0, 23.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.320610046386719, -8.096750259399414, -7.872891426086426, -7.649032115936279, -7.425172805786133, -7.201313495635986, -6.97745418548584, -6.753594398498535, -6.529735565185547, -6.3058762550354, -6.082016944885254, -5.858157634735107, -5.634298324584961, -5.4104390144348145, -5.186579704284668, -4.962719917297363, -4.738860607147217, -4.51500129699707, -4.291141986846924, -4.067282676696777, -3.843423366546631, -3.6195640563964844, -3.395704507827759, -3.1718451976776123, -2.947985887527466, -2.7241265773773193, -2.500267267227173, -2.2764077186584473, -2.052548408508301, -1.8286892175674438, -1.6048297882080078, -1.3809704780578613, -1.157111644744873, -0.9332523345947266, -0.7093929648399353, -0.48553359508514404, -0.26167428493499756, -0.037814974784851074, 0.18604445457458496, 0.40990376472473145, 0.6337630748748779, 0.8576223850250244, 1.081481695175171, 1.305341124534607, 1.5292004346847534, 1.7530597448349, 1.976919174194336, 2.2007784843444824, 2.424637794494629, 2.6484971046447754, 2.872356414794922, 3.0962157249450684, 3.320075035095215, 3.5439343452453613, 3.767793893814087, 3.9916532039642334, 4.215512275695801, 4.439371585845947, 4.663230895996094, 4.88709020614624, 5.110949516296387, 5.334808826446533, 5.55866813659668, 5.782527923583984, 6.006387233734131]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 5.0, 8.0, 17.0, 13.0, 19.0, 26.0, 39.0, 51.0, 84.0, 165.0, 281.0, 854.0, 3713.0, 34815.0, 696021.0, 294499.0, 14599.0, 2133.0, 593.0, 240.0, 122.0, 70.0, 49.0, 36.0, 33.0, 19.0, 15.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.765625, -7.56036376953125, -7.3551025390625, -7.14984130859375, -6.944580078125, -6.73931884765625, -6.5340576171875, -6.32879638671875, -6.12353515625, -5.91827392578125, -5.7130126953125, -5.50775146484375, -5.302490234375, -5.09722900390625, -4.8919677734375, -4.68670654296875, -4.4814453125, -4.27618408203125, -4.0709228515625, -3.86566162109375, -3.660400390625, -3.45513916015625, -3.2498779296875, -3.04461669921875, -2.83935546875, -2.63409423828125, -2.4288330078125, -2.22357177734375, -2.018310546875, -1.81304931640625, -1.6077880859375, -1.40252685546875, -1.197265625, -0.99200439453125, -0.7867431640625, -0.58148193359375, -0.376220703125, -0.17095947265625, 0.0343017578125, 0.23956298828125, 0.44482421875, 0.65008544921875, 0.8553466796875, 1.06060791015625, 1.265869140625, 1.47113037109375, 1.6763916015625, 1.88165283203125, 2.0869140625, 2.29217529296875, 2.4974365234375, 2.70269775390625, 2.907958984375, 3.11322021484375, 3.3184814453125, 3.52374267578125, 3.72900390625, 3.93426513671875, 4.1395263671875, 4.34478759765625, 4.550048828125, 4.75531005859375, 4.9605712890625, 5.16583251953125, 5.37109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 15.0, 22.0, 35.0, 62.0, 90.0, 106.0, 152.0, 132.0, 125.0, 100.0, 73.0, 35.0, 25.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5654296875, -1.5314102172851562, -1.4973907470703125, -1.4633712768554688, -1.429351806640625, -1.3953323364257812, -1.3613128662109375, -1.3272933959960938, -1.29327392578125, -1.2592544555664062, -1.2252349853515625, -1.1912155151367188, -1.157196044921875, -1.1231765747070312, -1.0891571044921875, -1.0551376342773438, -1.0211181640625, -0.9870986938476562, -0.9530792236328125, -0.9190597534179688, -0.885040283203125, -0.8510208129882812, -0.8170013427734375, -0.7829818725585938, -0.74896240234375, -0.7149429321289062, -0.6809234619140625, -0.6469039916992188, -0.612884521484375, -0.5788650512695312, -0.5448455810546875, -0.5108261108398438, -0.476806640625, -0.44278717041015625, -0.4087677001953125, -0.37474822998046875, -0.340728759765625, -0.30670928955078125, -0.2726898193359375, -0.23867034912109375, -0.20465087890625, -0.17063140869140625, -0.1366119384765625, -0.10259246826171875, -0.068572998046875, -0.03455352783203125, -0.0005340576171875, 0.03348541259765625, 0.0675048828125, 0.10152435302734375, 0.1355438232421875, 0.16956329345703125, 0.203582763671875, 0.23760223388671875, 0.2716217041015625, 0.30564117431640625, 0.33966064453125, 0.37368011474609375, 0.4076995849609375, 0.44171905517578125, 0.475738525390625, 0.5097579956054688, 0.5437774658203125, 0.5777969360351562, 0.61181640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 10.0, 10.0, 12.0, 26.0, 24.0, 42.0, 52.0, 59.0, 92.0, 171.0, 231.0, 439.0, 823.0, 2062.0, 5877.0, 21159.0, 104115.0, 494979.0, 337172.0, 60286.0, 13615.0, 4047.0, 1497.0, 689.0, 353.0, 216.0, 128.0, 116.0, 58.0, 43.0, 29.0, 29.0, 19.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.517578125, -2.435943603515625, -2.35430908203125, -2.272674560546875, -2.1910400390625, -2.109405517578125, -2.02777099609375, -1.946136474609375, -1.864501953125, -1.782867431640625, -1.70123291015625, -1.619598388671875, -1.5379638671875, -1.456329345703125, -1.37469482421875, -1.293060302734375, -1.21142578125, -1.129791259765625, -1.04815673828125, -0.966522216796875, -0.8848876953125, -0.803253173828125, -0.72161865234375, -0.639984130859375, -0.558349609375, -0.476715087890625, -0.39508056640625, -0.313446044921875, -0.2318115234375, -0.150177001953125, -0.06854248046875, 0.013092041015625, 0.0947265625, 0.176361083984375, 0.25799560546875, 0.339630126953125, 0.4212646484375, 0.502899169921875, 0.58453369140625, 0.666168212890625, 0.747802734375, 0.829437255859375, 0.91107177734375, 0.992706298828125, 1.0743408203125, 1.155975341796875, 1.23760986328125, 1.319244384765625, 1.40087890625, 1.482513427734375, 1.56414794921875, 1.645782470703125, 1.7274169921875, 1.809051513671875, 1.89068603515625, 1.972320556640625, 2.053955078125, 2.135589599609375, 2.21722412109375, 2.298858642578125, 2.3804931640625, 2.462127685546875, 2.54376220703125, 2.625396728515625, 2.70703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 8.0, 8.0, 12.0, 7.0, 13.0, 9.0, 9.0, 17.0, 22.0, 27.0, 24.0, 46.0, 42.0, 55.0, 40.0, 62.0, 60.0, 72.0, 56.0, 57.0, 55.0, 56.0, 41.0, 29.0, 30.0, 28.0, 24.0, 16.0, 16.0, 13.0, 15.0, 14.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8348846435546875, -1.770355224609375, -1.7058258056640625, -1.64129638671875, -1.5767669677734375, -1.512237548828125, -1.4477081298828125, -1.3831787109375, -1.3186492919921875, -1.254119873046875, -1.1895904541015625, -1.12506103515625, -1.0605316162109375, -0.996002197265625, -0.9314727783203125, -0.866943359375, -0.8024139404296875, -0.737884521484375, -0.6733551025390625, -0.60882568359375, -0.5442962646484375, -0.479766845703125, -0.4152374267578125, -0.3507080078125, -0.2861785888671875, -0.221649169921875, -0.1571197509765625, -0.09259033203125, -0.0280609130859375, 0.036468505859375, 0.1009979248046875, 0.16552734375, 0.2300567626953125, 0.294586181640625, 0.3591156005859375, 0.42364501953125, 0.4881744384765625, 0.552703857421875, 0.6172332763671875, 0.6817626953125, 0.7462921142578125, 0.810821533203125, 0.8753509521484375, 0.93988037109375, 1.0044097900390625, 1.068939208984375, 1.1334686279296875, 1.197998046875, 1.2625274658203125, 1.327056884765625, 1.3915863037109375, 1.45611572265625, 1.5206451416015625, 1.585174560546875, 1.6497039794921875, 1.7142333984375, 1.7787628173828125, 1.843292236328125, 1.9078216552734375, 1.97235107421875, 2.0368804931640625, 2.101409912109375, 2.1659393310546875, 2.23046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 7.0, 7.0, 14.0, 8.0, 21.0, 26.0, 53.0, 82.0, 155.0, 339.0, 879.0, 2682.0, 9913.0, 64032.0, 661177.0, 274849.0, 26316.0, 5317.0, 1581.0, 524.0, 274.0, 108.0, 64.0, 39.0, 24.0, 11.0, 9.0, 10.0, 6.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70703125, -1.6533203125, -1.599609375, -1.5458984375, -1.4921875, -1.4384765625, -1.384765625, -1.3310546875, -1.27734375, -1.2236328125, -1.169921875, -1.1162109375, -1.0625, -1.0087890625, -0.955078125, -0.9013671875, -0.84765625, -0.7939453125, -0.740234375, -0.6865234375, -0.6328125, -0.5791015625, -0.525390625, -0.4716796875, -0.41796875, -0.3642578125, -0.310546875, -0.2568359375, -0.203125, -0.1494140625, -0.095703125, -0.0419921875, 0.01171875, 0.0654296875, 0.119140625, 0.1728515625, 0.2265625, 0.2802734375, 0.333984375, 0.3876953125, 0.44140625, 0.4951171875, 0.548828125, 0.6025390625, 0.65625, 0.7099609375, 0.763671875, 0.8173828125, 0.87109375, 0.9248046875, 0.978515625, 1.0322265625, 1.0859375, 1.1396484375, 1.193359375, 1.2470703125, 1.30078125, 1.3544921875, 1.408203125, 1.4619140625, 1.515625, 1.5693359375, 1.623046875, 1.6767578125, 1.73046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 1.0, 6.0, 8.0, 5.0, 22.0, 14.0, 26.0, 41.0, 50.0, 75.0, 104.0, 94.0, 97.0, 101.0, 84.0, 70.0, 48.0, 47.0, 40.0, 22.0, 19.0, 7.0, 5.0, 9.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002434253692626953, -0.00023712962865829468, -0.00023083388805389404, -0.0002245381474494934, -0.00021824240684509277, -0.00021194666624069214, -0.0002056509256362915, -0.00019935518503189087, -0.00019305944442749023, -0.0001867637038230896, -0.00018046796321868896, -0.00017417222261428833, -0.0001678764820098877, -0.00016158074140548706, -0.00015528500080108643, -0.0001489892601966858, -0.00014269351959228516, -0.00013639777898788452, -0.0001301020383834839, -0.00012380629777908325, -0.00011751055717468262, -0.00011121481657028198, -0.00010491907596588135, -9.862333536148071e-05, -9.232759475708008e-05, -8.603185415267944e-05, -7.973611354827881e-05, -7.344037294387817e-05, -6.714463233947754e-05, -6.0848891735076904e-05, -5.455315113067627e-05, -4.8257410526275635e-05, -4.1961669921875e-05, -3.5665929317474365e-05, -2.937018871307373e-05, -2.3074448108673096e-05, -1.677870750427246e-05, -1.0482966899871826e-05, -4.187226295471191e-06, 2.1085143089294434e-06, 8.404254913330078e-06, 1.4699995517730713e-05, 2.0995736122131348e-05, 2.7291476726531982e-05, 3.358721733093262e-05, 3.988295793533325e-05, 4.617869853973389e-05, 5.247443914413452e-05, 5.8770179748535156e-05, 6.506592035293579e-05, 7.136166095733643e-05, 7.765740156173706e-05, 8.39531421661377e-05, 9.024888277053833e-05, 9.654462337493896e-05, 0.0001028403639793396, 0.00010913610458374023, 0.00011543184518814087, 0.0001217275857925415, 0.00012802332639694214, 0.00013431906700134277, 0.0001406148076057434, 0.00014691054821014404, 0.00015320628881454468, 0.0001595020294189453]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 9.0, 4.0, 10.0, 19.0, 18.0, 23.0, 41.0, 48.0, 74.0, 146.0, 251.0, 437.0, 856.0, 1770.0, 4112.0, 12147.0, 53046.0, 532934.0, 386768.0, 39328.0, 9640.0, 3497.0, 1583.0, 792.0, 376.0, 232.0, 123.0, 66.0, 52.0, 34.0, 28.0, 16.0, 17.0, 9.0, 8.0, 9.0, 4.0, 3.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.6142578125, -1.565216064453125, -1.51617431640625, -1.467132568359375, -1.4180908203125, -1.369049072265625, -1.32000732421875, -1.270965576171875, -1.221923828125, -1.172882080078125, -1.12384033203125, -1.074798583984375, -1.0257568359375, -0.976715087890625, -0.92767333984375, -0.878631591796875, -0.82958984375, -0.780548095703125, -0.73150634765625, -0.682464599609375, -0.6334228515625, -0.584381103515625, -0.53533935546875, -0.486297607421875, -0.437255859375, -0.388214111328125, -0.33917236328125, -0.290130615234375, -0.2410888671875, -0.192047119140625, -0.14300537109375, -0.093963623046875, -0.044921875, 0.004119873046875, 0.05316162109375, 0.102203369140625, 0.1512451171875, 0.200286865234375, 0.24932861328125, 0.298370361328125, 0.347412109375, 0.396453857421875, 0.44549560546875, 0.494537353515625, 0.5435791015625, 0.592620849609375, 0.64166259765625, 0.690704345703125, 0.73974609375, 0.788787841796875, 0.83782958984375, 0.886871337890625, 0.9359130859375, 0.984954833984375, 1.03399658203125, 1.083038330078125, 1.132080078125, 1.181121826171875, 1.23016357421875, 1.279205322265625, 1.3282470703125, 1.377288818359375, 1.42633056640625, 1.475372314453125, 1.5244140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 18.0, 34.0, 49.0, 79.0, 108.0, 128.0, 164.0, 118.0, 103.0, 61.0, 41.0, 18.0, 16.0, 11.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4150390625, -1.377227783203125, -1.33941650390625, -1.301605224609375, -1.2637939453125, -1.225982666015625, -1.18817138671875, -1.150360107421875, -1.112548828125, -1.074737548828125, -1.03692626953125, -0.999114990234375, -0.9613037109375, -0.923492431640625, -0.88568115234375, -0.847869873046875, -0.81005859375, -0.772247314453125, -0.73443603515625, -0.696624755859375, -0.6588134765625, -0.621002197265625, -0.58319091796875, -0.545379638671875, -0.507568359375, -0.469757080078125, -0.43194580078125, -0.394134521484375, -0.3563232421875, -0.318511962890625, -0.28070068359375, -0.242889404296875, -0.205078125, -0.167266845703125, -0.12945556640625, -0.091644287109375, -0.0538330078125, -0.016021728515625, 0.02178955078125, 0.059600830078125, 0.097412109375, 0.135223388671875, 0.17303466796875, 0.210845947265625, 0.2486572265625, 0.286468505859375, 0.32427978515625, 0.362091064453125, 0.39990234375, 0.437713623046875, 0.47552490234375, 0.513336181640625, 0.5511474609375, 0.588958740234375, 0.62677001953125, 0.664581298828125, 0.702392578125, 0.740203857421875, 0.77801513671875, 0.815826416015625, 0.8536376953125, 0.891448974609375, 0.92926025390625, 0.967071533203125, 1.0048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 13.0, 44.0, 88.0, 177.0, 241.0, 200.0, 120.0, 53.0, 28.0, 10.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.825170516967773, -21.15288734436035, -20.48060417175293, -19.808319091796875, -19.136035919189453, -18.46375274658203, -17.79146957397461, -17.119186401367188, -16.446903228759766, -15.774620056152344, -15.102335929870605, -14.430052757263184, -13.757768630981445, -13.085485458374023, -12.413202285766602, -11.74091911315918, -11.068634033203125, -10.396350860595703, -9.724066734313965, -9.051783561706543, -8.379499435424805, -7.707216262817383, -7.034933090209961, -6.362649440765381, -5.690365791320801, -5.018082141876221, -4.345798492431641, -3.6735153198242188, -3.0012316703796387, -2.3289480209350586, -1.6566648483276367, -0.9843811988830566, -0.3120994567871094, 0.36018407344818115, 1.0324676036834717, 1.7047510147094727, 2.3770346641540527, 3.049318313598633, 3.7216014862060547, 4.393885135650635, 5.066168785095215, 5.738452434539795, 6.410736083984375, 7.083019256591797, 7.755302906036377, 8.427586555480957, 9.099869728088379, 9.772153854370117, 10.444437026977539, 11.116720199584961, 11.7890043258667, 12.461287498474121, 13.13357162475586, 13.805854797363281, 14.478137969970703, 15.150421142578125, 15.822705268859863, 16.4949893951416, 17.167272567749023, 17.839555740356445, 18.511838912963867, 19.184123992919922, 19.856407165527344, 20.528690338134766, 21.200973510742188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 7.0, 4.0, 6.0, 6.0, 7.0, 13.0, 18.0, 25.0, 32.0, 25.0, 34.0, 28.0, 33.0, 36.0, 44.0, 46.0, 48.0, 59.0, 43.0, 42.0, 52.0, 49.0, 39.0, 43.0, 44.0, 33.0, 26.0, 21.0, 24.0, 28.0, 19.0, 10.0, 16.0, 15.0, 10.0, 7.0, 3.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.449064254760742, -11.130510330200195, -10.811956405639648, -10.493403434753418, -10.174849510192871, -9.856295585632324, -9.537741661071777, -9.219188690185547, -8.900634765625, -8.582080841064453, -8.263526916503906, -7.944973468780518, -7.626420021057129, -7.307866096496582, -6.989312171936035, -6.6707587242126465, -6.3522047996521, -6.033650875091553, -5.715097427368164, -5.396543502807617, -5.0779900550842285, -4.759436130523682, -4.440882682800293, -4.122328758239746, -3.8037750720977783, -3.4852213859558105, -3.1666676998138428, -2.848114013671875, -2.529560089111328, -2.2110066413879395, -1.8924527168273926, -1.5738990306854248, -1.255345344543457, -0.9367916584014893, -0.6182379126548767, -0.29968416690826416, 0.018869519233703613, 0.3374232053756714, 0.6559770107269287, 0.9745306968688965, 1.2930843830108643, 1.611638069152832, 1.9301917552947998, 2.2487454414367676, 2.5672993659973145, 2.885852813720703, 3.20440673828125, 3.5229604244232178, 3.8415141105651855, 4.160068035125732, 4.478621482849121, 4.797175407409668, 5.115728855133057, 5.4342827796936035, 5.752836227416992, 6.071390151977539, 6.389944076538086, 6.708498001098633, 7.0270514488220215, 7.345605373382568, 7.664158821105957, 7.982712745666504, 8.30126667022705, 8.619819641113281, 8.938373565673828]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 7.0, 4.0, 13.0, 7.0, 9.0, 8.0, 17.0, 17.0, 25.0, 15.0, 35.0, 36.0, 39.0, 79.0, 137.0, 182.0, 310.0, 680.0, 1722.0, 6498.0, 37899.0, 3642669.0, 473459.0, 23714.0, 4513.0, 1285.0, 490.0, 206.0, 92.0, 35.0, 29.0, 11.0, 15.0, 10.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.985626220703125, -7.79937744140625, -7.613128662109375, -7.4268798828125, -7.240631103515625, -7.05438232421875, -6.868133544921875, -6.681884765625, -6.495635986328125, -6.30938720703125, -6.123138427734375, -5.9368896484375, -5.750640869140625, -5.56439208984375, -5.378143310546875, -5.19189453125, -5.005645751953125, -4.81939697265625, -4.633148193359375, -4.4468994140625, -4.260650634765625, -4.07440185546875, -3.888153076171875, -3.701904296875, -3.515655517578125, -3.32940673828125, -3.143157958984375, -2.9569091796875, -2.770660400390625, -2.58441162109375, -2.398162841796875, -2.2119140625, -2.025665283203125, -1.83941650390625, -1.653167724609375, -1.4669189453125, -1.280670166015625, -1.09442138671875, -0.908172607421875, -0.721923828125, -0.535675048828125, -0.34942626953125, -0.163177490234375, 0.0230712890625, 0.209320068359375, 0.39556884765625, 0.581817626953125, 0.76806640625, 0.954315185546875, 1.14056396484375, 1.326812744140625, 1.5130615234375, 1.699310302734375, 1.88555908203125, 2.071807861328125, 2.258056640625, 2.444305419921875, 2.63055419921875, 2.816802978515625, 3.0030517578125, 3.189300537109375, 3.37554931640625, 3.561798095703125, 3.748046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 9.0, 20.0, 31.0, 42.0, 76.0, 95.0, 107.0, 127.0, 124.0, 106.0, 86.0, 58.0, 44.0, 41.0, 9.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0], "bins": [-1.5869140625, -1.5543861389160156, -1.5218582153320312, -1.4893302917480469, -1.4568023681640625, -1.4242744445800781, -1.3917465209960938, -1.3592185974121094, -1.326690673828125, -1.2941627502441406, -1.2616348266601562, -1.2291069030761719, -1.1965789794921875, -1.1640510559082031, -1.1315231323242188, -1.0989952087402344, -1.06646728515625, -1.0339393615722656, -1.0014114379882812, -0.9688835144042969, -0.9363555908203125, -0.9038276672363281, -0.8712997436523438, -0.8387718200683594, -0.806243896484375, -0.7737159729003906, -0.7411880493164062, -0.7086601257324219, -0.6761322021484375, -0.6436042785644531, -0.6110763549804688, -0.5785484313964844, -0.5460205078125, -0.5134925842285156, -0.48096466064453125, -0.4484367370605469, -0.4159088134765625, -0.3833808898925781, -0.35085296630859375, -0.3183250427246094, -0.285797119140625, -0.2532691955566406, -0.22074127197265625, -0.18821334838867188, -0.1556854248046875, -0.12315750122070312, -0.09062957763671875, -0.058101654052734375, -0.02557373046875, 0.006954193115234375, 0.03948211669921875, 0.07201004028320312, 0.1045379638671875, 0.13706588745117188, 0.16959381103515625, 0.20212173461914062, 0.234649658203125, 0.2671775817871094, 0.29970550537109375, 0.3322334289550781, 0.3647613525390625, 0.3972892761230469, 0.42981719970703125, 0.4623451232910156, 0.494873046875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 16.0, 32.0, 33.0, 78.0, 92.0, 167.0, 594.0, 4297.0, 4128943.0, 58235.0, 1247.0, 285.0, 106.0, 51.0, 43.0, 18.0, 12.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.4383544921875, -17.907958984375, -17.3775634765625, -16.84716796875, -16.3167724609375, -15.786376953125, -15.2559814453125, -14.7255859375, -14.1951904296875, -13.664794921875, -13.1343994140625, -12.60400390625, -12.0736083984375, -11.543212890625, -11.0128173828125, -10.482421875, -9.9520263671875, -9.421630859375, -8.8912353515625, -8.36083984375, -7.8304443359375, -7.300048828125, -6.7696533203125, -6.2392578125, -5.7088623046875, -5.178466796875, -4.6480712890625, -4.11767578125, -3.5872802734375, -3.056884765625, -2.5264892578125, -1.99609375, -1.4656982421875, -0.935302734375, -0.4049072265625, 0.12548828125, 0.6558837890625, 1.186279296875, 1.7166748046875, 2.2470703125, 2.7774658203125, 3.307861328125, 3.8382568359375, 4.36865234375, 4.8990478515625, 5.429443359375, 5.9598388671875, 6.490234375, 7.0206298828125, 7.551025390625, 8.0814208984375, 8.61181640625, 9.1422119140625, 9.672607421875, 10.2030029296875, 10.7333984375, 11.2637939453125, 11.794189453125, 12.3245849609375, 12.85498046875, 13.3853759765625, 13.915771484375, 14.4461669921875, 14.9765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 48.0, 146.0, 2306.0, 1412.0, 109.0, 23.0, 13.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21484375, -4.1231231689453125, -4.031402587890625, -3.9396820068359375, -3.84796142578125, -3.7562408447265625, -3.664520263671875, -3.5727996826171875, -3.4810791015625, -3.3893585205078125, -3.297637939453125, -3.2059173583984375, -3.11419677734375, -3.0224761962890625, -2.930755615234375, -2.8390350341796875, -2.747314453125, -2.6555938720703125, -2.563873291015625, -2.4721527099609375, -2.38043212890625, -2.2887115478515625, -2.196990966796875, -2.1052703857421875, -2.0135498046875, -1.9218292236328125, -1.830108642578125, -1.7383880615234375, -1.64666748046875, -1.5549468994140625, -1.463226318359375, -1.3715057373046875, -1.27978515625, -1.1880645751953125, -1.096343994140625, -1.0046234130859375, -0.91290283203125, -0.8211822509765625, -0.729461669921875, -0.6377410888671875, -0.5460205078125, -0.4542999267578125, -0.362579345703125, -0.2708587646484375, -0.17913818359375, -0.0874176025390625, 0.004302978515625, 0.0960235595703125, 0.187744140625, 0.2794647216796875, 0.371185302734375, 0.4629058837890625, 0.55462646484375, 0.6463470458984375, 0.738067626953125, 0.8297882080078125, 0.9215087890625, 1.0132293701171875, 1.104949951171875, 1.1966705322265625, 1.28839111328125, 1.3801116943359375, 1.471832275390625, 1.5635528564453125, 1.6552734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 16.0, 48.0, 92.0, 163.0, 222.0, 221.0, 116.0, 54.0, 24.0, 14.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.490737915039062, -11.239913940429688, -10.989089965820312, -10.738265991210938, -10.487442016601562, -10.236618041992188, -9.985794067382812, -9.734970092773438, -9.484146118164062, -9.233322143554688, -8.982498168945312, -8.731674194335938, -8.480850219726562, -8.230026245117188, -7.9792022705078125, -7.7283782958984375, -7.4775543212890625, -7.2267303466796875, -6.9759063720703125, -6.7250823974609375, -6.4742584228515625, -6.2234344482421875, -5.9726104736328125, -5.7217864990234375, -5.4709625244140625, -5.2201385498046875, -4.9693145751953125, -4.7184906005859375, -4.4676666259765625, -4.2168426513671875, -3.9660186767578125, -3.7151947021484375, -3.4643712043762207, -3.2135472297668457, -2.9627232551574707, -2.7118992805480957, -2.4610753059387207, -2.2102513313293457, -1.9594273567199707, -1.7086033821105957, -1.4577794075012207, -1.2069554328918457, -0.9561314582824707, -0.7053074836730957, -0.4544835090637207, -0.2036595344543457, 0.0471644401550293, 0.2979884147644043, 0.5488123893737793, 0.7996363639831543, 1.0504603385925293, 1.3012843132019043, 1.5521082878112793, 1.8029322624206543, 2.0537562370300293, 2.3045802116394043, 2.5554041862487793, 2.8062281608581543, 3.0570521354675293, 3.3078761100769043, 3.5587000846862793, 3.8095240592956543, 4.060348033905029, 4.311172008514404, 4.561995983123779]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 11.0, 16.0, 19.0, 18.0, 33.0, 53.0, 68.0, 77.0, 70.0, 98.0, 91.0, 94.0, 93.0, 82.0, 53.0, 38.0, 31.0, 21.0, 14.0, 9.0, 12.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.294525146484375, -6.098509311676025, -5.902493000030518, -5.706477165222168, -5.510461330413818, -5.314445495605469, -5.118429183959961, -4.922413349151611, -4.726397514343262, -4.530381679534912, -4.334365367889404, -4.138349533081055, -3.942333698272705, -3.7463176250457764, -3.5503015518188477, -3.354285717010498, -3.1582694053649902, -2.9622533321380615, -2.766237497329712, -2.570221424102783, -2.3742055892944336, -2.178189516067505, -1.9821734428405762, -1.786157488822937, -1.5901415348052979, -1.3941255807876587, -1.1981096267700195, -1.0020935535430908, -0.8060775995254517, -0.6100616455078125, -0.4140455722808838, -0.21802961826324463, -0.022013187408447266, 0.17400279641151428, 0.37001878023147583, 0.5660347938537598, 0.7620507478713989, 0.9580667018890381, 1.1540827751159668, 1.350098729133606, 1.5461146831512451, 1.7421306371688843, 1.9381465911865234, 2.134162664413452, 2.330178737640381, 2.5261945724487305, 2.722210645675659, 2.918226718902588, 3.1142425537109375, 3.310258626937866, 3.506274461746216, 3.7022905349731445, 3.898306369781494, 4.094322204589844, 4.290338516235352, 4.486354351043701, 4.682370185852051, 4.8783860206604, 5.074402332305908, 5.270418167114258, 5.466434001922607, 5.662449836730957, 5.858466148376465, 6.0544819831848145, 6.250498294830322]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 14.0, 13.0, 28.0, 27.0, 38.0, 87.0, 164.0, 282.0, 762.0, 2514.0, 15368.0, 355346.0, 642420.0, 26371.0, 3350.0, 1007.0, 342.0, 158.0, 89.0, 51.0, 33.0, 28.0, 14.0, 11.0, 8.0, 7.0, 8.0, 5.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40625, -6.169921875, -5.93359375, -5.697265625, -5.4609375, -5.224609375, -4.98828125, -4.751953125, -4.515625, -4.279296875, -4.04296875, -3.806640625, -3.5703125, -3.333984375, -3.09765625, -2.861328125, -2.625, -2.388671875, -2.15234375, -1.916015625, -1.6796875, -1.443359375, -1.20703125, -0.970703125, -0.734375, -0.498046875, -0.26171875, -0.025390625, 0.2109375, 0.447265625, 0.68359375, 0.919921875, 1.15625, 1.392578125, 1.62890625, 1.865234375, 2.1015625, 2.337890625, 2.57421875, 2.810546875, 3.046875, 3.283203125, 3.51953125, 3.755859375, 3.9921875, 4.228515625, 4.46484375, 4.701171875, 4.9375, 5.173828125, 5.41015625, 5.646484375, 5.8828125, 6.119140625, 6.35546875, 6.591796875, 6.828125, 7.064453125, 7.30078125, 7.537109375, 7.7734375, 8.009765625, 8.24609375, 8.482421875, 8.71875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 18.0, 27.0, 45.0, 56.0, 75.0, 108.0, 90.0, 122.0, 111.0, 106.0, 62.0, 57.0, 39.0, 39.0, 17.0, 5.0, 6.0, 5.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.572265625, -1.5384063720703125, -1.504547119140625, -1.4706878662109375, -1.43682861328125, -1.4029693603515625, -1.369110107421875, -1.3352508544921875, -1.3013916015625, -1.2675323486328125, -1.233673095703125, -1.1998138427734375, -1.16595458984375, -1.1320953369140625, -1.098236083984375, -1.0643768310546875, -1.030517578125, -0.9966583251953125, -0.962799072265625, -0.9289398193359375, -0.89508056640625, -0.8612213134765625, -0.827362060546875, -0.7935028076171875, -0.7596435546875, -0.7257843017578125, -0.691925048828125, -0.6580657958984375, -0.62420654296875, -0.5903472900390625, -0.556488037109375, -0.5226287841796875, -0.48876953125, -0.4549102783203125, -0.421051025390625, -0.3871917724609375, -0.35333251953125, -0.3194732666015625, -0.285614013671875, -0.2517547607421875, -0.2178955078125, -0.1840362548828125, -0.150177001953125, -0.1163177490234375, -0.08245849609375, -0.0485992431640625, -0.014739990234375, 0.0191192626953125, 0.052978515625, 0.0868377685546875, 0.120697021484375, 0.1545562744140625, 0.18841552734375, 0.2222747802734375, 0.256134033203125, 0.2899932861328125, 0.3238525390625, 0.3577117919921875, 0.391571044921875, 0.4254302978515625, 0.45928955078125, 0.4931488037109375, 0.527008056640625, 0.5608673095703125, 0.5947265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 8.0, 16.0, 21.0, 29.0, 42.0, 68.0, 105.0, 232.0, 421.0, 1087.0, 3324.0, 16299.0, 169329.0, 745556.0, 96431.0, 11273.0, 2595.0, 869.0, 378.0, 181.0, 103.0, 61.0, 27.0, 25.0, 15.0, 13.0, 7.0, 9.0, 3.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-6.1953125, -6.045654296875, -5.89599609375, -5.746337890625, -5.5966796875, -5.447021484375, -5.29736328125, -5.147705078125, -4.998046875, -4.848388671875, -4.69873046875, -4.549072265625, -4.3994140625, -4.249755859375, -4.10009765625, -3.950439453125, -3.80078125, -3.651123046875, -3.50146484375, -3.351806640625, -3.2021484375, -3.052490234375, -2.90283203125, -2.753173828125, -2.603515625, -2.453857421875, -2.30419921875, -2.154541015625, -2.0048828125, -1.855224609375, -1.70556640625, -1.555908203125, -1.40625, -1.256591796875, -1.10693359375, -0.957275390625, -0.8076171875, -0.657958984375, -0.50830078125, -0.358642578125, -0.208984375, -0.059326171875, 0.09033203125, 0.239990234375, 0.3896484375, 0.539306640625, 0.68896484375, 0.838623046875, 0.98828125, 1.137939453125, 1.28759765625, 1.437255859375, 1.5869140625, 1.736572265625, 1.88623046875, 2.035888671875, 2.185546875, 2.335205078125, 2.48486328125, 2.634521484375, 2.7841796875, 2.933837890625, 3.08349609375, 3.233154296875, 3.3828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 13.0, 24.0, 23.0, 37.0, 34.0, 45.0, 53.0, 62.0, 58.0, 63.0, 87.0, 72.0, 77.0, 56.0, 44.0, 49.0, 34.0, 26.0, 24.0, 21.0, 15.0, 18.0, 7.0, 5.0, 6.0, 5.0, 4.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.584869384765625, -3.48419189453125, -3.383514404296875, -3.2828369140625, -3.182159423828125, -3.08148193359375, -2.980804443359375, -2.880126953125, -2.779449462890625, -2.67877197265625, -2.578094482421875, -2.4774169921875, -2.376739501953125, -2.27606201171875, -2.175384521484375, -2.07470703125, -1.974029541015625, -1.87335205078125, -1.772674560546875, -1.6719970703125, -1.571319580078125, -1.47064208984375, -1.369964599609375, -1.269287109375, -1.168609619140625, -1.06793212890625, -0.967254638671875, -0.8665771484375, -0.765899658203125, -0.66522216796875, -0.564544677734375, -0.4638671875, -0.363189697265625, -0.26251220703125, -0.161834716796875, -0.0611572265625, 0.039520263671875, 0.14019775390625, 0.240875244140625, 0.341552734375, 0.442230224609375, 0.54290771484375, 0.643585205078125, 0.7442626953125, 0.844940185546875, 0.94561767578125, 1.046295166015625, 1.14697265625, 1.247650146484375, 1.34832763671875, 1.449005126953125, 1.5496826171875, 1.650360107421875, 1.75103759765625, 1.851715087890625, 1.952392578125, 2.053070068359375, 2.15374755859375, 2.254425048828125, 2.3551025390625, 2.455780029296875, 2.55645751953125, 2.657135009765625, 2.7578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 9.0, 9.0, 20.0, 37.0, 42.0, 75.0, 129.0, 247.0, 815.0, 4066.0, 57531.0, 922957.0, 57189.0, 4002.0, 834.0, 267.0, 133.0, 59.0, 57.0, 28.0, 17.0, 12.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.80621337890625, -2.7003173828125, -2.59442138671875, -2.488525390625, -2.38262939453125, -2.2767333984375, -2.17083740234375, -2.06494140625, -1.95904541015625, -1.8531494140625, -1.74725341796875, -1.641357421875, -1.53546142578125, -1.4295654296875, -1.32366943359375, -1.2177734375, -1.11187744140625, -1.0059814453125, -0.90008544921875, -0.794189453125, -0.68829345703125, -0.5823974609375, -0.47650146484375, -0.37060546875, -0.26470947265625, -0.1588134765625, -0.05291748046875, 0.052978515625, 0.15887451171875, 0.2647705078125, 0.37066650390625, 0.4765625, 0.58245849609375, 0.6883544921875, 0.79425048828125, 0.900146484375, 1.00604248046875, 1.1119384765625, 1.21783447265625, 1.32373046875, 1.42962646484375, 1.5355224609375, 1.64141845703125, 1.747314453125, 1.85321044921875, 1.9591064453125, 2.06500244140625, 2.1708984375, 2.27679443359375, 2.3826904296875, 2.48858642578125, 2.594482421875, 2.70037841796875, 2.8062744140625, 2.91217041015625, 3.01806640625, 3.12396240234375, 3.2298583984375, 3.33575439453125, 3.441650390625, 3.54754638671875, 3.6534423828125, 3.75933837890625, 3.865234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 8.0, 6.0, 11.0, 22.0, 30.0, 51.0, 70.0, 120.0, 173.0, 157.0, 117.0, 88.0, 54.0, 44.0, 18.0, 11.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006299018859863281, -0.0006162114441394806, -0.0006025210022926331, -0.0005888305604457855, -0.000575140118598938, -0.0005614496767520905, -0.0005477592349052429, -0.0005340687930583954, -0.0005203783512115479, -0.0005066879093647003, -0.0004929974675178528, -0.00047930702567100525, -0.0004656165838241577, -0.0004519261419773102, -0.00043823570013046265, -0.0004245452582836151, -0.0004108548164367676, -0.00039716437458992004, -0.0003834739327430725, -0.000369783490896225, -0.00035609304904937744, -0.0003424026072025299, -0.0003287121653556824, -0.00031502172350883484, -0.0003013312816619873, -0.00028764083981513977, -0.00027395039796829224, -0.0002602599561214447, -0.00024656951427459717, -0.00023287907242774963, -0.0002191886305809021, -0.00020549818873405457, -0.00019180774688720703, -0.0001781173050403595, -0.00016442686319351196, -0.00015073642134666443, -0.0001370459794998169, -0.00012335553765296936, -0.00010966509580612183, -9.597465395927429e-05, -8.228421211242676e-05, -6.859377026557922e-05, -5.490332841873169e-05, -4.1212886571884155e-05, -2.752244472503662e-05, -1.3832002878189087e-05, -1.4156103134155273e-07, 1.3548880815505981e-05, 2.7239322662353516e-05, 4.092976450920105e-05, 5.4620206356048584e-05, 6.831064820289612e-05, 8.200109004974365e-05, 9.569153189659119e-05, 0.00010938197374343872, 0.00012307241559028625, 0.0001367628574371338, 0.00015045329928398132, 0.00016414374113082886, 0.0001778341829776764, 0.00019152462482452393, 0.00020521506667137146, 0.000218905508518219, 0.00023259595036506653, 0.00024628639221191406]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 14.0, 30.0, 37.0, 91.0, 129.0, 275.0, 731.0, 2291.0, 13091.0, 293762.0, 704816.0, 28059.0, 3496.0, 916.0, 364.0, 184.0, 96.0, 74.0, 37.0, 22.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.21875, -3.13653564453125, -3.0543212890625, -2.97210693359375, -2.889892578125, -2.80767822265625, -2.7254638671875, -2.64324951171875, -2.56103515625, -2.47882080078125, -2.3966064453125, -2.31439208984375, -2.232177734375, -2.14996337890625, -2.0677490234375, -1.98553466796875, -1.9033203125, -1.82110595703125, -1.7388916015625, -1.65667724609375, -1.574462890625, -1.49224853515625, -1.4100341796875, -1.32781982421875, -1.24560546875, -1.16339111328125, -1.0811767578125, -0.99896240234375, -0.916748046875, -0.83453369140625, -0.7523193359375, -0.67010498046875, -0.587890625, -0.50567626953125, -0.4234619140625, -0.34124755859375, -0.259033203125, -0.17681884765625, -0.0946044921875, -0.01239013671875, 0.06982421875, 0.15203857421875, 0.2342529296875, 0.31646728515625, 0.398681640625, 0.48089599609375, 0.5631103515625, 0.64532470703125, 0.7275390625, 0.80975341796875, 0.8919677734375, 0.97418212890625, 1.056396484375, 1.13861083984375, 1.2208251953125, 1.30303955078125, 1.38525390625, 1.46746826171875, 1.5496826171875, 1.63189697265625, 1.714111328125, 1.79632568359375, 1.8785400390625, 1.96075439453125, 2.04296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 14.0, 21.0, 37.0, 54.0, 80.0, 110.0, 156.0, 139.0, 124.0, 91.0, 59.0, 42.0, 31.0, 11.0, 11.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0140838623046875, -0.973480224609375, -0.9328765869140625, -0.89227294921875, -0.8516693115234375, -0.811065673828125, -0.7704620361328125, -0.7298583984375, -0.6892547607421875, -0.648651123046875, -0.6080474853515625, -0.56744384765625, -0.5268402099609375, -0.486236572265625, -0.4456329345703125, -0.405029296875, -0.3644256591796875, -0.323822021484375, -0.2832183837890625, -0.24261474609375, -0.2020111083984375, -0.161407470703125, -0.1208038330078125, -0.0802001953125, -0.0395965576171875, 0.001007080078125, 0.0416107177734375, 0.08221435546875, 0.1228179931640625, 0.163421630859375, 0.2040252685546875, 0.24462890625, 0.2852325439453125, 0.325836181640625, 0.3664398193359375, 0.40704345703125, 0.4476470947265625, 0.488250732421875, 0.5288543701171875, 0.5694580078125, 0.6100616455078125, 0.650665283203125, 0.6912689208984375, 0.73187255859375, 0.7724761962890625, 0.813079833984375, 0.8536834716796875, 0.894287109375, 0.9348907470703125, 0.975494384765625, 1.0160980224609375, 1.05670166015625, 1.0973052978515625, 1.137908935546875, 1.1785125732421875, 1.2191162109375, 1.2597198486328125, 1.300323486328125, 1.3409271240234375, 1.38153076171875, 1.4221343994140625, 1.462738037109375, 1.5033416748046875, 1.5439453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 16.0, 70.0, 159.0, 315.0, 245.0, 113.0, 42.0, 16.0, 12.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.54263687133789, -56.40836715698242, -55.27410125732422, -54.13983154296875, -53.00556182861328, -51.87129592895508, -50.73702621459961, -49.602760314941406, -48.46849060058594, -47.33422088623047, -46.199954986572266, -45.0656852722168, -43.931419372558594, -42.797149658203125, -41.662879943847656, -40.52861404418945, -39.394344329833984, -38.260074615478516, -37.12580871582031, -35.991539001464844, -34.857269287109375, -33.72300338745117, -32.5887336730957, -31.454465866088867, -30.32019805908203, -29.185930252075195, -28.05166244506836, -26.91739273071289, -25.783124923706055, -24.64885711669922, -23.51458740234375, -22.380319595336914, -21.246051788330078, -20.111783981323242, -18.977516174316406, -17.843246459960938, -16.7089786529541, -15.574710845947266, -14.440442085266113, -13.306173324584961, -12.171904563903809, -11.037635803222656, -9.90336799621582, -8.769100189208984, -7.634831428527832, -6.500563144683838, -5.366294860839844, -4.23202657699585, -3.0977582931518555, -1.9634900093078613, -0.8292217254638672, 0.30504655838012695, 1.439314842224121, 2.5735831260681152, 3.7078514099121094, 4.8421196937561035, 5.976387977600098, 7.110656261444092, 8.244924545288086, 9.379192352294922, 10.513461112976074, 11.647729873657227, 12.781997680664062, 13.916265487670898, 15.05053424835205]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 4.0, 10.0, 11.0, 4.0, 15.0, 27.0, 17.0, 25.0, 29.0, 37.0, 39.0, 37.0, 51.0, 57.0, 60.0, 50.0, 56.0, 67.0, 59.0, 45.0, 50.0, 33.0, 41.0, 34.0, 25.0, 38.0, 16.0, 12.0, 12.0, 6.0, 9.0, 9.0, 2.0, 4.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.690654754638672, -16.20299530029297, -15.715333938598633, -15.22767448425293, -14.74001407623291, -14.25235366821289, -13.764693260192871, -13.277032852172852, -12.789373397827148, -12.301712989807129, -11.81405258178711, -11.326393127441406, -10.838732719421387, -10.351072311401367, -9.863411903381348, -9.375751495361328, -8.888091087341309, -8.400430679321289, -7.912770748138428, -7.425110340118408, -6.937450408935547, -6.449790000915527, -5.962129592895508, -5.474469184875488, -4.986809253692627, -4.499148845672607, -4.011488914489746, -3.5238285064697266, -3.036168336868286, -2.5485081672668457, -2.060847759246826, -1.5731875896453857, -1.0855283737182617, -0.5978681445121765, -0.11020791530609131, 0.37745237350463867, 0.8651125431060791, 1.3527727127075195, 1.840433120727539, 2.3280932903289795, 2.81575345993042, 3.3034136295318604, 3.791073799133301, 4.27873420715332, 4.76639461517334, 5.254054546356201, 5.741714954376221, 6.229374885559082, 6.717035293579102, 7.204695701599121, 7.692355632781982, 8.180015563964844, 8.667675971984863, 9.155336380004883, 9.642996788024902, 10.130657196044922, 10.618316650390625, 11.105977058410645, 11.593637466430664, 12.081296920776367, 12.568957328796387, 13.056617736816406, 13.544278144836426, 14.031938552856445, 14.519598960876465]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 8.0, 15.0, 9.0, 22.0, 8.0, 12.0, 22.0, 32.0, 28.0, 34.0, 41.0, 47.0, 72.0, 80.0, 137.0, 195.0, 294.0, 490.0, 987.0, 2402.0, 6854.0, 25448.0, 198892.0, 3799736.0, 128417.0, 20562.0, 5727.0, 2036.0, 837.0, 401.0, 216.0, 89.0, 55.0, 34.0, 7.0, 5.0, 7.0, 4.0, 2.0, 1.0], "bins": [-8.828125, -8.641937255859375, -8.45574951171875, -8.269561767578125, -8.0833740234375, -7.897186279296875, -7.71099853515625, -7.524810791015625, -7.338623046875, -7.152435302734375, -6.96624755859375, -6.780059814453125, -6.5938720703125, -6.407684326171875, -6.22149658203125, -6.035308837890625, -5.84912109375, -5.662933349609375, -5.47674560546875, -5.290557861328125, -5.1043701171875, -4.918182373046875, -4.73199462890625, -4.545806884765625, -4.359619140625, -4.173431396484375, -3.98724365234375, -3.801055908203125, -3.6148681640625, -3.428680419921875, -3.24249267578125, -3.056304931640625, -2.8701171875, -2.683929443359375, -2.49774169921875, -2.311553955078125, -2.1253662109375, -1.939178466796875, -1.75299072265625, -1.566802978515625, -1.380615234375, -1.194427490234375, -1.00823974609375, -0.822052001953125, -0.6358642578125, -0.449676513671875, -0.26348876953125, -0.077301025390625, 0.10888671875, 0.295074462890625, 0.48126220703125, 0.667449951171875, 0.8536376953125, 1.039825439453125, 1.22601318359375, 1.412200927734375, 1.598388671875, 1.784576416015625, 1.97076416015625, 2.156951904296875, 2.3431396484375, 2.529327392578125, 2.71551513671875, 2.901702880859375, 3.087890625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 13.0, 14.0, 27.0, 46.0, 50.0, 79.0, 79.0, 83.0, 117.0, 106.0, 91.0, 76.0, 66.0, 56.0, 38.0, 21.0, 12.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.5615234375, -1.5288467407226562, -1.4961700439453125, -1.4634933471679688, -1.430816650390625, -1.3981399536132812, -1.3654632568359375, -1.3327865600585938, -1.30010986328125, -1.2674331665039062, -1.2347564697265625, -1.2020797729492188, -1.169403076171875, -1.1367263793945312, -1.1040496826171875, -1.0713729858398438, -1.0386962890625, -1.0060195922851562, -0.9733428955078125, -0.9406661987304688, -0.907989501953125, -0.8753128051757812, -0.8426361083984375, -0.8099594116210938, -0.77728271484375, -0.7446060180664062, -0.7119293212890625, -0.6792526245117188, -0.646575927734375, -0.6138992309570312, -0.5812225341796875, -0.5485458374023438, -0.515869140625, -0.48319244384765625, -0.4505157470703125, -0.41783905029296875, -0.385162353515625, -0.35248565673828125, -0.3198089599609375, -0.28713226318359375, -0.25445556640625, -0.22177886962890625, -0.1891021728515625, -0.15642547607421875, -0.123748779296875, -0.09107208251953125, -0.0583953857421875, -0.02571868896484375, 0.0069580078125, 0.03963470458984375, 0.0723114013671875, 0.10498809814453125, 0.137664794921875, 0.17034149169921875, 0.2030181884765625, 0.23569488525390625, 0.26837158203125, 0.30104827880859375, 0.3337249755859375, 0.36640167236328125, 0.399078369140625, 0.43175506591796875, 0.4644317626953125, 0.49710845947265625, 0.52978515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 14.0, 11.0, 12.0, 34.0, 50.0, 78.0, 171.0, 342.0, 654.0, 1677.0, 4494.0, 27414.0, 4005446.0, 142847.0, 7488.0, 2007.0, 803.0, 357.0, 166.0, 76.0, 52.0, 28.0, 17.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0625, -13.70849609375, -13.3544921875, -13.00048828125, -12.646484375, -12.29248046875, -11.9384765625, -11.58447265625, -11.23046875, -10.87646484375, -10.5224609375, -10.16845703125, -9.814453125, -9.46044921875, -9.1064453125, -8.75244140625, -8.3984375, -8.04443359375, -7.6904296875, -7.33642578125, -6.982421875, -6.62841796875, -6.2744140625, -5.92041015625, -5.56640625, -5.21240234375, -4.8583984375, -4.50439453125, -4.150390625, -3.79638671875, -3.4423828125, -3.08837890625, -2.734375, -2.38037109375, -2.0263671875, -1.67236328125, -1.318359375, -0.96435546875, -0.6103515625, -0.25634765625, 0.09765625, 0.45166015625, 0.8056640625, 1.15966796875, 1.513671875, 1.86767578125, 2.2216796875, 2.57568359375, 2.9296875, 3.28369140625, 3.6376953125, 3.99169921875, 4.345703125, 4.69970703125, 5.0537109375, 5.40771484375, 5.76171875, 6.11572265625, 6.4697265625, 6.82373046875, 7.177734375, 7.53173828125, 7.8857421875, 8.23974609375, 8.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 4.0, 12.0, 19.0, 37.0, 85.0, 254.0, 2199.0, 1188.0, 160.0, 49.0, 23.0, 9.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.6385498046875, -4.519287109375, -4.4000244140625, -4.28076171875, -4.1614990234375, -4.042236328125, -3.9229736328125, -3.8037109375, -3.6844482421875, -3.565185546875, -3.4459228515625, -3.32666015625, -3.2073974609375, -3.088134765625, -2.9688720703125, -2.849609375, -2.7303466796875, -2.611083984375, -2.4918212890625, -2.37255859375, -2.2532958984375, -2.134033203125, -2.0147705078125, -1.8955078125, -1.7762451171875, -1.656982421875, -1.5377197265625, -1.41845703125, -1.2991943359375, -1.179931640625, -1.0606689453125, -0.94140625, -0.8221435546875, -0.702880859375, -0.5836181640625, -0.46435546875, -0.3450927734375, -0.225830078125, -0.1065673828125, 0.0126953125, 0.1319580078125, 0.251220703125, 0.3704833984375, 0.48974609375, 0.6090087890625, 0.728271484375, 0.8475341796875, 0.966796875, 1.0860595703125, 1.205322265625, 1.3245849609375, 1.44384765625, 1.5631103515625, 1.682373046875, 1.8016357421875, 1.9208984375, 2.0401611328125, 2.159423828125, 2.2786865234375, 2.39794921875, 2.5172119140625, 2.636474609375, 2.7557373046875, 2.875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 14.0, 50.0, 161.0, 389.0, 291.0, 75.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-49.422332763671875, -48.52080154418945, -47.6192741394043, -46.717742919921875, -45.81621170043945, -44.91468048095703, -44.013153076171875, -43.11162185668945, -42.21009063720703, -41.30855941772461, -40.40703201293945, -39.50550079345703, -38.60396957397461, -37.70243835449219, -36.80091094970703, -35.89937973022461, -34.99784851074219, -34.096317291259766, -33.19478988647461, -32.29325866699219, -31.391727447509766, -30.490198135375977, -29.588668823242188, -28.687137603759766, -27.78561019897461, -26.88408088684082, -25.9825496673584, -25.08102035522461, -24.179489135742188, -23.2779598236084, -22.37643051147461, -21.474899291992188, -20.573368072509766, -19.671838760375977, -18.770307540893555, -17.868778228759766, -16.967247009277344, -16.065717697143555, -15.16418743133545, -14.262657165527344, -13.361126899719238, -12.459596633911133, -11.558066368103027, -10.656536102294922, -9.755006790161133, -8.853475570678711, -7.951946258544922, -7.050415992736816, -6.148885726928711, -5.2473554611206055, -4.3458251953125, -3.4442954063415527, -2.5427651405334473, -1.6412348747253418, -0.7397050857543945, 0.16182518005371094, 1.0633554458618164, 1.9648855924606323, 2.8664157390594482, 3.7679457664489746, 4.66947603225708, 5.5710062980651855, 6.472536087036133, 7.374066352844238, 8.275596618652344]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 18.0, 27.0, 39.0, 76.0, 142.0, 162.0, 172.0, 141.0, 106.0, 59.0, 24.0, 23.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.877960205078125, -17.244781494140625, -16.611602783203125, -15.978422164916992, -15.345243453979492, -14.712064743041992, -14.078885078430176, -13.44570541381836, -12.81252670288086, -12.17934799194336, -11.546168327331543, -10.912988662719727, -10.279809951782227, -9.646631240844727, -9.01345157623291, -8.380271911621094, -7.747093200683594, -7.1139140129089355, -6.480734825134277, -5.847555637359619, -5.214376449584961, -4.581197261810303, -3.9480180740356445, -3.3148388862609863, -2.681659698486328, -2.04848051071167, -1.4153013229370117, -0.7821221351623535, -0.1489429473876953, 0.4842362403869629, 1.117415428161621, 1.7505946159362793, 2.3837757110595703, 3.0169548988342285, 3.6501340866088867, 4.283313274383545, 4.916492462158203, 5.549671649932861, 6.1828508377075195, 6.816030025482178, 7.449209213256836, 8.082387924194336, 8.715567588806152, 9.348747253417969, 9.981925964355469, 10.615104675292969, 11.248284339904785, 11.881464004516602, 12.514642715454102, 13.147821426391602, 13.781001091003418, 14.414180755615234, 15.047359466552734, 15.680538177490234, 16.313716888427734, 16.946897506713867, 17.580076217651367, 18.213254928588867, 18.846435546875, 19.4796142578125, 20.11279296875, 20.7459716796875, 21.379150390625, 22.012331008911133, 22.645509719848633]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 7.0, 7.0, 10.0, 12.0, 18.0, 29.0, 37.0, 70.0, 116.0, 211.0, 413.0, 945.0, 2594.0, 13119.0, 191050.0, 772143.0, 58391.0, 6363.0, 1602.0, 680.0, 290.0, 159.0, 101.0, 62.0, 42.0, 26.0, 17.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.63677978515625, -7.4141845703125, -7.19158935546875, -6.968994140625, -6.74639892578125, -6.5238037109375, -6.30120849609375, -6.07861328125, -5.85601806640625, -5.6334228515625, -5.41082763671875, -5.188232421875, -4.96563720703125, -4.7430419921875, -4.52044677734375, -4.2978515625, -4.07525634765625, -3.8526611328125, -3.63006591796875, -3.407470703125, -3.18487548828125, -2.9622802734375, -2.73968505859375, -2.51708984375, -2.29449462890625, -2.0718994140625, -1.84930419921875, -1.626708984375, -1.40411376953125, -1.1815185546875, -0.95892333984375, -0.736328125, -0.51373291015625, -0.2911376953125, -0.06854248046875, 0.154052734375, 0.37664794921875, 0.5992431640625, 0.82183837890625, 1.04443359375, 1.26702880859375, 1.4896240234375, 1.71221923828125, 1.934814453125, 2.15740966796875, 2.3800048828125, 2.60260009765625, 2.8251953125, 3.04779052734375, 3.2703857421875, 3.49298095703125, 3.715576171875, 3.93817138671875, 4.1607666015625, 4.38336181640625, 4.60595703125, 4.82855224609375, 5.0511474609375, 5.27374267578125, 5.496337890625, 5.71893310546875, 5.9415283203125, 6.16412353515625, 6.38671875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 5.0, 15.0, 31.0, 30.0, 81.0, 91.0, 109.0, 143.0, 118.0, 120.0, 83.0, 68.0, 35.0, 28.0, 16.0, 15.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.87109375, -1.8275375366210938, -1.7839813232421875, -1.7404251098632812, -1.696868896484375, -1.6533126831054688, -1.6097564697265625, -1.5662002563476562, -1.52264404296875, -1.4790878295898438, -1.4355316162109375, -1.3919754028320312, -1.348419189453125, -1.3048629760742188, -1.2613067626953125, -1.2177505493164062, -1.1741943359375, -1.1306381225585938, -1.0870819091796875, -1.0435256958007812, -0.999969482421875, -0.9564132690429688, -0.9128570556640625, -0.8693008422851562, -0.82574462890625, -0.7821884155273438, -0.7386322021484375, -0.6950759887695312, -0.651519775390625, -0.6079635620117188, -0.5644073486328125, -0.5208511352539062, -0.477294921875, -0.43373870849609375, -0.3901824951171875, -0.34662628173828125, -0.303070068359375, -0.25951385498046875, -0.2159576416015625, -0.17240142822265625, -0.12884521484375, -0.08528900146484375, -0.0417327880859375, 0.00182342529296875, 0.045379638671875, 0.08893585205078125, 0.1324920654296875, 0.17604827880859375, 0.2196044921875, 0.26316070556640625, 0.3067169189453125, 0.35027313232421875, 0.393829345703125, 0.43738555908203125, 0.4809417724609375, 0.5244979858398438, 0.56805419921875, 0.6116104125976562, 0.6551666259765625, 0.6987228393554688, 0.742279052734375, 0.7858352661132812, 0.8293914794921875, 0.8729476928710938, 0.91650390625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 13.0, 29.0, 41.0, 61.0, 111.0, 241.0, 521.0, 1327.0, 5045.0, 27439.0, 230456.0, 641208.0, 121133.0, 15805.0, 3302.0, 981.0, 386.0, 187.0, 102.0, 53.0, 33.0, 25.0, 10.0, 8.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.435546875, -3.318511962890625, -3.20147705078125, -3.084442138671875, -2.9674072265625, -2.850372314453125, -2.73333740234375, -2.616302490234375, -2.499267578125, -2.382232666015625, -2.26519775390625, -2.148162841796875, -2.0311279296875, -1.914093017578125, -1.79705810546875, -1.680023193359375, -1.56298828125, -1.445953369140625, -1.32891845703125, -1.211883544921875, -1.0948486328125, -0.977813720703125, -0.86077880859375, -0.743743896484375, -0.626708984375, -0.509674072265625, -0.39263916015625, -0.275604248046875, -0.1585693359375, -0.041534423828125, 0.07550048828125, 0.192535400390625, 0.3095703125, 0.426605224609375, 0.54364013671875, 0.660675048828125, 0.7777099609375, 0.894744873046875, 1.01177978515625, 1.128814697265625, 1.245849609375, 1.362884521484375, 1.47991943359375, 1.596954345703125, 1.7139892578125, 1.831024169921875, 1.94805908203125, 2.065093994140625, 2.18212890625, 2.299163818359375, 2.41619873046875, 2.533233642578125, 2.6502685546875, 2.767303466796875, 2.88433837890625, 3.001373291015625, 3.118408203125, 3.235443115234375, 3.35247802734375, 3.469512939453125, 3.5865478515625, 3.703582763671875, 3.82061767578125, 3.937652587890625, 4.0546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 10.0, 11.0, 17.0, 14.0, 22.0, 21.0, 25.0, 32.0, 33.0, 43.0, 45.0, 45.0, 46.0, 48.0, 54.0, 49.0, 47.0, 43.0, 48.0, 46.0, 38.0, 43.0, 27.0, 27.0, 36.0, 16.0, 24.0, 9.0, 17.0, 13.0, 6.0, 6.0, 8.0, 7.0, 9.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4453125, -2.369781494140625, -2.29425048828125, -2.218719482421875, -2.1431884765625, -2.067657470703125, -1.99212646484375, -1.916595458984375, -1.841064453125, -1.765533447265625, -1.69000244140625, -1.614471435546875, -1.5389404296875, -1.463409423828125, -1.38787841796875, -1.312347412109375, -1.23681640625, -1.161285400390625, -1.08575439453125, -1.010223388671875, -0.9346923828125, -0.859161376953125, -0.78363037109375, -0.708099365234375, -0.632568359375, -0.557037353515625, -0.48150634765625, -0.405975341796875, -0.3304443359375, -0.254913330078125, -0.17938232421875, -0.103851318359375, -0.0283203125, 0.047210693359375, 0.12274169921875, 0.198272705078125, 0.2738037109375, 0.349334716796875, 0.42486572265625, 0.500396728515625, 0.575927734375, 0.651458740234375, 0.72698974609375, 0.802520751953125, 0.8780517578125, 0.953582763671875, 1.02911376953125, 1.104644775390625, 1.18017578125, 1.255706787109375, 1.33123779296875, 1.406768798828125, 1.4822998046875, 1.557830810546875, 1.63336181640625, 1.708892822265625, 1.784423828125, 1.859954833984375, 1.93548583984375, 2.011016845703125, 2.0865478515625, 2.162078857421875, 2.23760986328125, 2.313140869140625, 2.388671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 13.0, 25.0, 52.0, 65.0, 118.0, 234.0, 394.0, 905.0, 2430.0, 7676.0, 34192.0, 292483.0, 609831.0, 80000.0, 13714.0, 3782.0, 1412.0, 579.0, 270.0, 154.0, 84.0, 43.0, 28.0, 12.0, 11.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.474609375, -1.4223480224609375, -1.370086669921875, -1.3178253173828125, -1.26556396484375, -1.2133026123046875, -1.161041259765625, -1.1087799072265625, -1.0565185546875, -1.0042572021484375, -0.951995849609375, -0.8997344970703125, -0.84747314453125, -0.7952117919921875, -0.742950439453125, -0.6906890869140625, -0.638427734375, -0.5861663818359375, -0.533905029296875, -0.4816436767578125, -0.42938232421875, -0.3771209716796875, -0.324859619140625, -0.2725982666015625, -0.2203369140625, -0.1680755615234375, -0.115814208984375, -0.0635528564453125, -0.01129150390625, 0.0409698486328125, 0.093231201171875, 0.1454925537109375, 0.19775390625, 0.2500152587890625, 0.302276611328125, 0.3545379638671875, 0.40679931640625, 0.4590606689453125, 0.511322021484375, 0.5635833740234375, 0.6158447265625, 0.6681060791015625, 0.720367431640625, 0.7726287841796875, 0.82489013671875, 0.8771514892578125, 0.929412841796875, 0.9816741943359375, 1.033935546875, 1.0861968994140625, 1.138458251953125, 1.1907196044921875, 1.24298095703125, 1.2952423095703125, 1.347503662109375, 1.3997650146484375, 1.4520263671875, 1.5042877197265625, 1.556549072265625, 1.6088104248046875, 1.66107177734375, 1.7133331298828125, 1.765594482421875, 1.8178558349609375, 1.8701171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 8.0, 10.0, 11.0, 34.0, 18.0, 38.0, 51.0, 66.0, 75.0, 69.0, 83.0, 76.0, 101.0, 83.0, 53.0, 48.0, 37.0, 28.0, 22.0, 27.0, 13.0, 11.0, 6.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002548694610595703, -0.00024819374084472656, -0.0002415180206298828, -0.00023484230041503906, -0.0002281665802001953, -0.00022149085998535156, -0.0002148151397705078, -0.00020813941955566406, -0.0002014636993408203, -0.00019478797912597656, -0.0001881122589111328, -0.00018143653869628906, -0.0001747608184814453, -0.00016808509826660156, -0.0001614093780517578, -0.00015473365783691406, -0.0001480579376220703, -0.00014138221740722656, -0.0001347064971923828, -0.00012803077697753906, -0.00012135505676269531, -0.00011467933654785156, -0.00010800361633300781, -0.00010132789611816406, -9.465217590332031e-05, -8.797645568847656e-05, -8.130073547363281e-05, -7.462501525878906e-05, -6.794929504394531e-05, -6.127357482910156e-05, -5.459785461425781e-05, -4.792213439941406e-05, -4.124641418457031e-05, -3.457069396972656e-05, -2.7894973754882812e-05, -2.1219253540039062e-05, -1.4543533325195312e-05, -7.867813110351562e-06, -1.1920928955078125e-06, 5.4836273193359375e-06, 1.2159347534179688e-05, 1.8835067749023438e-05, 2.5510787963867188e-05, 3.218650817871094e-05, 3.886222839355469e-05, 4.553794860839844e-05, 5.221366882324219e-05, 5.888938903808594e-05, 6.556510925292969e-05, 7.224082946777344e-05, 7.891654968261719e-05, 8.559226989746094e-05, 9.226799011230469e-05, 9.894371032714844e-05, 0.00010561943054199219, 0.00011229515075683594, 0.00011897087097167969, 0.00012564659118652344, 0.0001323223114013672, 0.00013899803161621094, 0.0001456737518310547, 0.00015234947204589844, 0.0001590251922607422, 0.00016570091247558594, 0.0001723766326904297]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 12.0, 24.0, 18.0, 31.0, 52.0, 76.0, 124.0, 212.0, 383.0, 772.0, 1728.0, 4912.0, 20036.0, 145354.0, 694600.0, 150919.0, 20935.0, 4899.0, 1684.0, 807.0, 388.0, 217.0, 116.0, 77.0, 49.0, 35.0, 26.0, 17.0, 15.0, 1.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5048828125, -1.453887939453125, -1.40289306640625, -1.351898193359375, -1.3009033203125, -1.249908447265625, -1.19891357421875, -1.147918701171875, -1.096923828125, -1.045928955078125, -0.99493408203125, -0.943939208984375, -0.8929443359375, -0.841949462890625, -0.79095458984375, -0.739959716796875, -0.68896484375, -0.637969970703125, -0.58697509765625, -0.535980224609375, -0.4849853515625, -0.433990478515625, -0.38299560546875, -0.332000732421875, -0.281005859375, -0.230010986328125, -0.17901611328125, -0.128021240234375, -0.0770263671875, -0.026031494140625, 0.02496337890625, 0.075958251953125, 0.126953125, 0.177947998046875, 0.22894287109375, 0.279937744140625, 0.3309326171875, 0.381927490234375, 0.43292236328125, 0.483917236328125, 0.534912109375, 0.585906982421875, 0.63690185546875, 0.687896728515625, 0.7388916015625, 0.789886474609375, 0.84088134765625, 0.891876220703125, 0.94287109375, 0.993865966796875, 1.04486083984375, 1.095855712890625, 1.1468505859375, 1.197845458984375, 1.24884033203125, 1.299835205078125, 1.350830078125, 1.401824951171875, 1.45281982421875, 1.503814697265625, 1.5548095703125, 1.605804443359375, 1.65679931640625, 1.707794189453125, 1.7587890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 1.0, 9.0, 11.0, 20.0, 21.0, 42.0, 51.0, 60.0, 82.0, 95.0, 126.0, 113.0, 88.0, 58.0, 65.0, 50.0, 33.0, 24.0, 15.0, 4.0, 9.0, 13.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8366470336914062, -0.8026885986328125, -0.7687301635742188, -0.734771728515625, -0.7008132934570312, -0.6668548583984375, -0.6328964233398438, -0.59893798828125, -0.5649795532226562, -0.5310211181640625, -0.49706268310546875, -0.463104248046875, -0.42914581298828125, -0.3951873779296875, -0.36122894287109375, -0.3272705078125, -0.29331207275390625, -0.2593536376953125, -0.22539520263671875, -0.191436767578125, -0.15747833251953125, -0.1235198974609375, -0.08956146240234375, -0.05560302734375, -0.02164459228515625, 0.0123138427734375, 0.04627227783203125, 0.080230712890625, 0.11418914794921875, 0.1481475830078125, 0.18210601806640625, 0.216064453125, 0.25002288818359375, 0.2839813232421875, 0.31793975830078125, 0.351898193359375, 0.38585662841796875, 0.4198150634765625, 0.45377349853515625, 0.48773193359375, 0.5216903686523438, 0.5556488037109375, 0.5896072387695312, 0.623565673828125, 0.6575241088867188, 0.6914825439453125, 0.7254409790039062, 0.7593994140625, 0.7933578491210938, 0.8273162841796875, 0.8612747192382812, 0.895233154296875, 0.9291915893554688, 0.9631500244140625, 0.9971084594726562, 1.03106689453125, 1.0650253295898438, 1.0989837646484375, 1.1329421997070312, 1.166900634765625, 1.2008590698242188, 1.2348175048828125, 1.2687759399414062, 1.302734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 15.0, 11.0, 46.0, 88.0, 124.0, 189.0, 192.0, 151.0, 86.0, 50.0, 24.0, 13.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.194259643554688, -22.491138458251953, -21.788015365600586, -21.08489418029785, -20.381772994995117, -19.678651809692383, -18.975528717041016, -18.27240753173828, -17.569286346435547, -16.866165161132812, -16.163042068481445, -15.459920883178711, -14.756799697875977, -14.053677558898926, -13.350555419921875, -12.64743423461914, -11.94431209564209, -11.241189956665039, -10.538068771362305, -9.834946632385254, -9.13182544708252, -8.428703308105469, -7.725581645965576, -7.022459983825684, -6.319338321685791, -5.616216659545898, -4.913094997406006, -4.209973335266113, -3.5068514347076416, -2.803729772567749, -2.1006078720092773, -1.3974862098693848, -0.6943645477294922, 0.008757174015045166, 0.7118788957595825, 1.4150006771087646, 2.1181223392486572, 2.82124400138855, 3.5243659019470215, 4.227487564086914, 4.930609226226807, 5.633730888366699, 6.336852550506592, 7.039974212646484, 7.743096351623535, 8.44621753692627, 9.14933967590332, 9.852460861206055, 10.555583000183105, 11.258705139160156, 11.96182632446289, 12.664948463439941, 13.368069648742676, 14.071191787719727, 14.774312973022461, 15.477435111999512, 16.180557250976562, 16.883678436279297, 17.586801528930664, 18.2899227142334, 18.993043899536133, 19.696165084838867, 20.399288177490234, 21.10240936279297, 21.805530548095703]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 6.0, 10.0, 10.0, 11.0, 22.0, 16.0, 22.0, 25.0, 22.0, 30.0, 30.0, 34.0, 36.0, 48.0, 43.0, 39.0, 58.0, 54.0, 48.0, 57.0, 50.0, 35.0, 28.0, 30.0, 26.0, 38.0, 26.0, 21.0, 19.0, 15.0, 16.0, 14.0, 11.0, 7.0, 8.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.616498947143555, -14.191328048706055, -13.766157150268555, -13.340985298156738, -12.915814399719238, -12.490643501281738, -12.065471649169922, -11.640300750732422, -11.215129852294922, -10.789958953857422, -10.364788055419922, -9.939616203308105, -9.514445304870605, -9.089274406433105, -8.664102554321289, -8.238931655883789, -7.813760757446289, -7.388589859008789, -6.963418483734131, -6.538247108459473, -6.113076210021973, -5.687905311584473, -5.2627339363098145, -4.837562561035156, -4.412391662597656, -3.987220525741577, -3.562049388885498, -3.136878252029419, -2.71170711517334, -2.2865359783172607, -1.8613648414611816, -1.4361937046051025, -1.0110235214233398, -0.5858523845672607, -0.16068124771118164, 0.26448988914489746, 0.6896610260009766, 1.1148321628570557, 1.5400032997131348, 1.9651744365692139, 2.390345573425293, 2.815516710281372, 3.240687847137451, 3.6658589839935303, 4.091030120849609, 4.516201019287109, 4.941372394561768, 5.366543769836426, 5.791714668273926, 6.216885566711426, 6.642056941986084, 7.067228317260742, 7.492399215698242, 7.917570114135742, 8.342741012573242, 8.767912864685059, 9.193083763122559, 9.618254661560059, 10.043426513671875, 10.468597412109375, 10.893768310546875, 11.318939208984375, 11.744110107421875, 12.169281959533691, 12.594452857971191]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 7.0, 14.0, 14.0, 20.0, 18.0, 39.0, 45.0, 59.0, 103.0, 127.0, 243.0, 373.0, 783.0, 1970.0, 6302.0, 36076.0, 3431352.0, 681953.0, 26540.0, 5107.0, 1685.0, 657.0, 318.0, 197.0, 88.0, 56.0, 25.0, 22.0, 21.0, 15.0, 10.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.85546875, -5.6776123046875, -5.499755859375, -5.3218994140625, -5.14404296875, -4.9661865234375, -4.788330078125, -4.6104736328125, -4.4326171875, -4.2547607421875, -4.076904296875, -3.8990478515625, -3.72119140625, -3.5433349609375, -3.365478515625, -3.1876220703125, -3.009765625, -2.8319091796875, -2.654052734375, -2.4761962890625, -2.29833984375, -2.1204833984375, -1.942626953125, -1.7647705078125, -1.5869140625, -1.4090576171875, -1.231201171875, -1.0533447265625, -0.87548828125, -0.6976318359375, -0.519775390625, -0.3419189453125, -0.1640625, 0.0137939453125, 0.191650390625, 0.3695068359375, 0.54736328125, 0.7252197265625, 0.903076171875, 1.0809326171875, 1.2587890625, 1.4366455078125, 1.614501953125, 1.7923583984375, 1.97021484375, 2.1480712890625, 2.325927734375, 2.5037841796875, 2.681640625, 2.8594970703125, 3.037353515625, 3.2152099609375, 3.39306640625, 3.5709228515625, 3.748779296875, 3.9266357421875, 4.1044921875, 4.2823486328125, 4.460205078125, 4.6380615234375, 4.81591796875, 4.9937744140625, 5.171630859375, 5.3494873046875, 5.52734375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 12.0, 32.0, 53.0, 58.0, 78.0, 89.0, 112.0, 103.0, 118.0, 103.0, 75.0, 59.0, 43.0, 24.0, 16.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8779296875, -1.833648681640625, -1.78936767578125, -1.745086669921875, -1.7008056640625, -1.656524658203125, -1.61224365234375, -1.567962646484375, -1.523681640625, -1.479400634765625, -1.43511962890625, -1.390838623046875, -1.3465576171875, -1.302276611328125, -1.25799560546875, -1.213714599609375, -1.16943359375, -1.125152587890625, -1.08087158203125, -1.036590576171875, -0.9923095703125, -0.948028564453125, -0.90374755859375, -0.859466552734375, -0.815185546875, -0.770904541015625, -0.72662353515625, -0.682342529296875, -0.6380615234375, -0.593780517578125, -0.54949951171875, -0.505218505859375, -0.4609375, -0.416656494140625, -0.37237548828125, -0.328094482421875, -0.2838134765625, -0.239532470703125, -0.19525146484375, -0.150970458984375, -0.106689453125, -0.062408447265625, -0.01812744140625, 0.026153564453125, 0.0704345703125, 0.114715576171875, 0.15899658203125, 0.203277587890625, 0.24755859375, 0.291839599609375, 0.33612060546875, 0.380401611328125, 0.4246826171875, 0.468963623046875, 0.51324462890625, 0.557525634765625, 0.601806640625, 0.646087646484375, 0.69036865234375, 0.734649658203125, 0.7789306640625, 0.823211669921875, 0.86749267578125, 0.911773681640625, 0.9560546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 19.0, 21.0, 39.0, 58.0, 90.0, 173.0, 355.0, 1129.0, 6606.0, 120752.0, 4008797.0, 50355.0, 4257.0, 916.0, 332.0, 145.0, 88.0, 45.0, 31.0, 22.0, 13.0, 10.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2265625, -7.9940185546875, -7.761474609375, -7.5289306640625, -7.29638671875, -7.0638427734375, -6.831298828125, -6.5987548828125, -6.3662109375, -6.1336669921875, -5.901123046875, -5.6685791015625, -5.43603515625, -5.2034912109375, -4.970947265625, -4.7384033203125, -4.505859375, -4.2733154296875, -4.040771484375, -3.8082275390625, -3.57568359375, -3.3431396484375, -3.110595703125, -2.8780517578125, -2.6455078125, -2.4129638671875, -2.180419921875, -1.9478759765625, -1.71533203125, -1.4827880859375, -1.250244140625, -1.0177001953125, -0.78515625, -0.5526123046875, -0.320068359375, -0.0875244140625, 0.14501953125, 0.3775634765625, 0.610107421875, 0.8426513671875, 1.0751953125, 1.3077392578125, 1.540283203125, 1.7728271484375, 2.00537109375, 2.2379150390625, 2.470458984375, 2.7030029296875, 2.935546875, 3.1680908203125, 3.400634765625, 3.6331787109375, 3.86572265625, 4.0982666015625, 4.330810546875, 4.5633544921875, 4.7958984375, 5.0284423828125, 5.260986328125, 5.4935302734375, 5.72607421875, 5.9586181640625, 6.191162109375, 6.4237060546875, 6.65625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 20.0, 29.0, 52.0, 87.0, 191.0, 660.0, 2237.0, 415.0, 164.0, 68.0, 53.0, 24.0, 22.0, 11.0, 10.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.740234375, -1.6880035400390625, -1.635772705078125, -1.5835418701171875, -1.53131103515625, -1.4790802001953125, -1.426849365234375, -1.3746185302734375, -1.3223876953125, -1.2701568603515625, -1.217926025390625, -1.1656951904296875, -1.11346435546875, -1.0612335205078125, -1.009002685546875, -0.9567718505859375, -0.904541015625, -0.8523101806640625, -0.800079345703125, -0.7478485107421875, -0.69561767578125, -0.6433868408203125, -0.591156005859375, -0.5389251708984375, -0.4866943359375, -0.4344635009765625, -0.382232666015625, -0.3300018310546875, -0.27777099609375, -0.2255401611328125, -0.173309326171875, -0.1210784912109375, -0.06884765625, -0.0166168212890625, 0.035614013671875, 0.0878448486328125, 0.14007568359375, 0.1923065185546875, 0.244537353515625, 0.2967681884765625, 0.3489990234375, 0.4012298583984375, 0.453460693359375, 0.5056915283203125, 0.55792236328125, 0.6101531982421875, 0.662384033203125, 0.7146148681640625, 0.766845703125, 0.8190765380859375, 0.871307373046875, 0.9235382080078125, 0.97576904296875, 1.0279998779296875, 1.080230712890625, 1.1324615478515625, 1.1846923828125, 1.2369232177734375, 1.289154052734375, 1.3413848876953125, 1.39361572265625, 1.4458465576171875, 1.498077392578125, 1.5503082275390625, 1.6025390625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 17.0, 39.0, 124.0, 200.0, 235.0, 211.0, 89.0, 41.0, 19.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.390524864196777, -10.022367477416992, -9.654211044311523, -9.286053657531738, -8.917896270751953, -8.549738883972168, -8.181581497192383, -7.813425064086914, -7.445267677307129, -7.077110290527344, -6.708953380584717, -6.34079647064209, -5.972639083862305, -5.6044816970825195, -5.236324787139893, -4.868167877197266, -4.5000104904174805, -4.131853103637695, -3.7636961936950684, -3.3955390453338623, -3.0273818969726562, -2.65922474861145, -2.291067600250244, -1.922910451889038, -1.554753303527832, -1.186596155166626, -0.8184390068054199, -0.45028185844421387, -0.08212471008300781, 0.28603243827819824, 0.6541895866394043, 1.0223467350006104, 1.3905029296875, 1.758660078048706, 2.126817226409912, 2.494974374771118, 2.863131523132324, 3.2312886714935303, 3.5994458198547363, 3.9676029682159424, 4.335760116577148, 4.703917503356934, 5.0720744132995605, 5.4402313232421875, 5.808388710021973, 6.176546096801758, 6.544703006744385, 6.912859916687012, 7.281017303466797, 7.649174690246582, 8.017332077026367, 8.385488510131836, 8.753645896911621, 9.121803283691406, 9.489959716796875, 9.85811710357666, 10.226274490356445, 10.59443187713623, 10.962589263916016, 11.330745697021484, 11.69890308380127, 12.067060470581055, 12.435216903686523, 12.803374290466309, 13.171531677246094]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 8.0, 7.0, 10.0, 8.0, 10.0, 8.0, 17.0, 14.0, 18.0, 16.0, 30.0, 28.0, 40.0, 35.0, 43.0, 56.0, 42.0, 44.0, 44.0, 47.0, 40.0, 42.0, 48.0, 33.0, 32.0, 44.0, 30.0, 29.0, 19.0, 26.0, 20.0, 18.0, 20.0, 12.0, 13.0, 8.0, 7.0, 9.0, 3.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.454960584640503, -3.342747449874878, -3.230534076690674, -3.118320941925049, -3.006107807159424, -2.893894672393799, -2.7816812992095947, -2.6694681644439697, -2.5572547912597656, -2.4450416564941406, -2.3328282833099365, -2.2206151485443115, -2.1084020137786865, -1.996188759803772, -1.8839755058288574, -1.7717623710632324, -1.6595492362976074, -1.5473359823226929, -1.4351228475570679, -1.3229095935821533, -1.2106964588165283, -1.0984832048416138, -0.9862699508666992, -0.8740567564964294, -0.7618435621261597, -0.6496303677558899, -0.5374171733856201, -0.42520391941070557, -0.3129907250404358, -0.20077753067016602, -0.08856427669525146, 0.02364891767501831, 0.13586211204528809, 0.24807532131671906, 0.36028853058815, 0.4725017547607422, 0.584714949131012, 0.6969281435012817, 0.8091413974761963, 0.9213545918464661, 1.0335677862167358, 1.1457810401916504, 1.2579941749572754, 1.37020742893219, 1.4824206829071045, 1.5946338176727295, 1.706847071647644, 1.8190603256225586, 1.9312734603881836, 2.0434865951538086, 2.1556999683380127, 2.2679131031036377, 2.3801262378692627, 2.492339611053467, 2.604552745819092, 2.716765880584717, 2.828979015350342, 2.941192150115967, 3.053405523300171, 3.165618658065796, 3.277831792831421, 3.390045166015625, 3.50225830078125, 3.614471435546875, 3.726684808731079]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 12.0, 12.0, 25.0, 27.0, 58.0, 91.0, 216.0, 428.0, 1129.0, 3863.0, 27473.0, 491954.0, 490046.0, 27379.0, 3809.0, 1112.0, 452.0, 194.0, 97.0, 53.0, 41.0, 33.0, 14.0, 9.0, 5.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.84979248046875, -6.6214599609375, -6.39312744140625, -6.164794921875, -5.93646240234375, -5.7081298828125, -5.47979736328125, -5.25146484375, -5.02313232421875, -4.7947998046875, -4.56646728515625, -4.338134765625, -4.10980224609375, -3.8814697265625, -3.65313720703125, -3.4248046875, -3.19647216796875, -2.9681396484375, -2.73980712890625, -2.511474609375, -2.28314208984375, -2.0548095703125, -1.82647705078125, -1.59814453125, -1.36981201171875, -1.1414794921875, -0.91314697265625, -0.684814453125, -0.45648193359375, -0.2281494140625, 0.00018310546875, 0.228515625, 0.45684814453125, 0.6851806640625, 0.91351318359375, 1.141845703125, 1.37017822265625, 1.5985107421875, 1.82684326171875, 2.05517578125, 2.28350830078125, 2.5118408203125, 2.74017333984375, 2.968505859375, 3.19683837890625, 3.4251708984375, 3.65350341796875, 3.8818359375, 4.11016845703125, 4.3385009765625, 4.56683349609375, 4.795166015625, 5.02349853515625, 5.2518310546875, 5.48016357421875, 5.70849609375, 5.93682861328125, 6.1651611328125, 6.39349365234375, 6.621826171875, 6.85015869140625, 7.0784912109375, 7.30682373046875, 7.53515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 36.0, 45.0, 55.0, 90.0, 88.0, 94.0, 125.0, 109.0, 92.0, 82.0, 61.0, 45.0, 30.0, 12.0, 6.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8310546875, -1.78790283203125, -1.7447509765625, -1.70159912109375, -1.658447265625, -1.61529541015625, -1.5721435546875, -1.52899169921875, -1.48583984375, -1.44268798828125, -1.3995361328125, -1.35638427734375, -1.313232421875, -1.27008056640625, -1.2269287109375, -1.18377685546875, -1.140625, -1.09747314453125, -1.0543212890625, -1.01116943359375, -0.968017578125, -0.92486572265625, -0.8817138671875, -0.83856201171875, -0.79541015625, -0.75225830078125, -0.7091064453125, -0.66595458984375, -0.622802734375, -0.57965087890625, -0.5364990234375, -0.49334716796875, -0.4501953125, -0.40704345703125, -0.3638916015625, -0.32073974609375, -0.277587890625, -0.23443603515625, -0.1912841796875, -0.14813232421875, -0.10498046875, -0.06182861328125, -0.0186767578125, 0.02447509765625, 0.067626953125, 0.11077880859375, 0.1539306640625, 0.19708251953125, 0.240234375, 0.28338623046875, 0.3265380859375, 0.36968994140625, 0.412841796875, 0.45599365234375, 0.4991455078125, 0.54229736328125, 0.58544921875, 0.62860107421875, 0.6717529296875, 0.71490478515625, 0.758056640625, 0.80120849609375, 0.8443603515625, 0.88751220703125, 0.9306640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 3.0, 5.0, 12.0, 19.0, 17.0, 24.0, 33.0, 47.0, 58.0, 112.0, 155.0, 253.0, 488.0, 913.0, 2083.0, 4831.0, 13814.0, 42697.0, 151138.0, 422199.0, 287255.0, 83293.0, 24698.0, 8237.0, 3184.0, 1348.0, 667.0, 360.0, 200.0, 117.0, 67.0, 65.0, 40.0, 30.0, 24.0, 17.0, 7.0, 8.0, 8.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.171875, -2.098907470703125, -2.02593994140625, -1.952972412109375, -1.8800048828125, -1.807037353515625, -1.73406982421875, -1.661102294921875, -1.588134765625, -1.515167236328125, -1.44219970703125, -1.369232177734375, -1.2962646484375, -1.223297119140625, -1.15032958984375, -1.077362060546875, -1.00439453125, -0.931427001953125, -0.85845947265625, -0.785491943359375, -0.7125244140625, -0.639556884765625, -0.56658935546875, -0.493621826171875, -0.420654296875, -0.347686767578125, -0.27471923828125, -0.201751708984375, -0.1287841796875, -0.055816650390625, 0.01715087890625, 0.090118408203125, 0.1630859375, 0.236053466796875, 0.30902099609375, 0.381988525390625, 0.4549560546875, 0.527923583984375, 0.60089111328125, 0.673858642578125, 0.746826171875, 0.819793701171875, 0.89276123046875, 0.965728759765625, 1.0386962890625, 1.111663818359375, 1.18463134765625, 1.257598876953125, 1.33056640625, 1.403533935546875, 1.47650146484375, 1.549468994140625, 1.6224365234375, 1.695404052734375, 1.76837158203125, 1.841339111328125, 1.914306640625, 1.987274169921875, 2.06024169921875, 2.133209228515625, 2.2061767578125, 2.279144287109375, 2.35211181640625, 2.425079345703125, 2.498046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 6.0, 10.0, 6.0, 12.0, 7.0, 22.0, 18.0, 16.0, 29.0, 23.0, 16.0, 26.0, 32.0, 37.0, 34.0, 41.0, 39.0, 34.0, 41.0, 45.0, 25.0, 43.0, 42.0, 28.0, 34.0, 35.0, 35.0, 34.0, 30.0, 29.0, 24.0, 22.0, 20.0, 16.0, 14.0, 17.0, 14.0, 10.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.03125, -1.962860107421875, -1.89447021484375, -1.826080322265625, -1.7576904296875, -1.689300537109375, -1.62091064453125, -1.552520751953125, -1.484130859375, -1.415740966796875, -1.34735107421875, -1.278961181640625, -1.2105712890625, -1.142181396484375, -1.07379150390625, -1.005401611328125, -0.93701171875, -0.868621826171875, -0.80023193359375, -0.731842041015625, -0.6634521484375, -0.595062255859375, -0.52667236328125, -0.458282470703125, -0.389892578125, -0.321502685546875, -0.25311279296875, -0.184722900390625, -0.1163330078125, -0.047943115234375, 0.02044677734375, 0.088836669921875, 0.1572265625, 0.225616455078125, 0.29400634765625, 0.362396240234375, 0.4307861328125, 0.499176025390625, 0.56756591796875, 0.635955810546875, 0.704345703125, 0.772735595703125, 0.84112548828125, 0.909515380859375, 0.9779052734375, 1.046295166015625, 1.11468505859375, 1.183074951171875, 1.25146484375, 1.319854736328125, 1.38824462890625, 1.456634521484375, 1.5250244140625, 1.593414306640625, 1.66180419921875, 1.730194091796875, 1.798583984375, 1.866973876953125, 1.93536376953125, 2.003753662109375, 2.0721435546875, 2.140533447265625, 2.20892333984375, 2.277313232421875, 2.345703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 9.0, 13.0, 15.0, 31.0, 49.0, 103.0, 180.0, 450.0, 1558.0, 11014.0, 981648.0, 49522.0, 2765.0, 642.0, 247.0, 111.0, 70.0, 35.0, 28.0, 10.0, 7.0, 10.0, 8.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.12567138671875, -5.9193115234375, -5.71295166015625, -5.506591796875, -5.30023193359375, -5.0938720703125, -4.88751220703125, -4.68115234375, -4.47479248046875, -4.2684326171875, -4.06207275390625, -3.855712890625, -3.64935302734375, -3.4429931640625, -3.23663330078125, -3.0302734375, -2.82391357421875, -2.6175537109375, -2.41119384765625, -2.204833984375, -1.99847412109375, -1.7921142578125, -1.58575439453125, -1.37939453125, -1.17303466796875, -0.9666748046875, -0.76031494140625, -0.553955078125, -0.34759521484375, -0.1412353515625, 0.06512451171875, 0.271484375, 0.47784423828125, 0.6842041015625, 0.89056396484375, 1.096923828125, 1.30328369140625, 1.5096435546875, 1.71600341796875, 1.92236328125, 2.12872314453125, 2.3350830078125, 2.54144287109375, 2.747802734375, 2.95416259765625, 3.1605224609375, 3.36688232421875, 3.5732421875, 3.77960205078125, 3.9859619140625, 4.19232177734375, 4.398681640625, 4.60504150390625, 4.8114013671875, 5.01776123046875, 5.22412109375, 5.43048095703125, 5.6368408203125, 5.84320068359375, 6.049560546875, 6.25592041015625, 6.4622802734375, 6.66864013671875, 6.875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 13.0, 35.0, 137.0, 449.0, 243.0, 75.0, 22.0, 12.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006699562072753906, -0.0006321743130683899, -0.0005943924188613892, -0.0005566105246543884, -0.0005188286304473877, -0.00048104673624038696, -0.00044326484203338623, -0.0004054829478263855, -0.00036770105361938477, -0.00032991915941238403, -0.0002921372652053833, -0.00025435537099838257, -0.00021657347679138184, -0.0001787915825843811, -0.00014100968837738037, -0.00010322779417037964, -6.54458999633789e-05, -2.7664005756378174e-05, 1.0117888450622559e-05, 4.789978265762329e-05, 8.568167686462402e-05, 0.00012346357107162476, 0.0001612454652786255, 0.00019902735948562622, 0.00023680925369262695, 0.0002745911478996277, 0.0003123730421066284, 0.00035015493631362915, 0.0003879368305206299, 0.0004257187247276306, 0.00046350061893463135, 0.0005012825131416321, 0.0005390644073486328, 0.0005768463015556335, 0.0006146281957626343, 0.000652410089969635, 0.0006901919841766357, 0.0007279738783836365, 0.0007657557725906372, 0.0008035376667976379, 0.0008413195610046387, 0.0008791014552116394, 0.0009168833494186401, 0.0009546652436256409, 0.0009924471378326416, 0.0010302290320396423, 0.001068010926246643, 0.0011057928204536438, 0.0011435747146606445, 0.0011813566088676453, 0.001219138503074646, 0.0012569203972816467, 0.0012947022914886475, 0.0013324841856956482, 0.001370266079902649, 0.0014080479741096497, 0.0014458298683166504, 0.0014836117625236511, 0.0015213936567306519, 0.0015591755509376526, 0.0015969574451446533, 0.001634739339351654, 0.0016725212335586548, 0.0017103031277656555, 0.0017480850219726562]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 10.0, 13.0, 22.0, 32.0, 56.0, 84.0, 172.0, 404.0, 1626.0, 16409.0, 997679.0, 29120.0, 2072.0, 429.0, 154.0, 87.0, 54.0, 38.0, 22.0, 15.0, 19.0, 16.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.515625, -7.32568359375, -7.1357421875, -6.94580078125, -6.755859375, -6.56591796875, -6.3759765625, -6.18603515625, -5.99609375, -5.80615234375, -5.6162109375, -5.42626953125, -5.236328125, -5.04638671875, -4.8564453125, -4.66650390625, -4.4765625, -4.28662109375, -4.0966796875, -3.90673828125, -3.716796875, -3.52685546875, -3.3369140625, -3.14697265625, -2.95703125, -2.76708984375, -2.5771484375, -2.38720703125, -2.197265625, -2.00732421875, -1.8173828125, -1.62744140625, -1.4375, -1.24755859375, -1.0576171875, -0.86767578125, -0.677734375, -0.48779296875, -0.2978515625, -0.10791015625, 0.08203125, 0.27197265625, 0.4619140625, 0.65185546875, 0.841796875, 1.03173828125, 1.2216796875, 1.41162109375, 1.6015625, 1.79150390625, 1.9814453125, 2.17138671875, 2.361328125, 2.55126953125, 2.7412109375, 2.93115234375, 3.12109375, 3.31103515625, 3.5009765625, 3.69091796875, 3.880859375, 4.07080078125, 4.2607421875, 4.45068359375, 4.640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 13.0, 14.0, 31.0, 61.0, 116.0, 184.0, 228.0, 176.0, 93.0, 41.0, 22.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.384765625, -1.304840087890625, -1.22491455078125, -1.144989013671875, -1.0650634765625, -0.985137939453125, -0.90521240234375, -0.825286865234375, -0.745361328125, -0.665435791015625, -0.58551025390625, -0.505584716796875, -0.4256591796875, -0.345733642578125, -0.26580810546875, -0.185882568359375, -0.10595703125, -0.026031494140625, 0.05389404296875, 0.133819580078125, 0.2137451171875, 0.293670654296875, 0.37359619140625, 0.453521728515625, 0.533447265625, 0.613372802734375, 0.69329833984375, 0.773223876953125, 0.8531494140625, 0.933074951171875, 1.01300048828125, 1.092926025390625, 1.1728515625, 1.252777099609375, 1.33270263671875, 1.412628173828125, 1.4925537109375, 1.572479248046875, 1.65240478515625, 1.732330322265625, 1.812255859375, 1.892181396484375, 1.97210693359375, 2.052032470703125, 2.1319580078125, 2.211883544921875, 2.29180908203125, 2.371734619140625, 2.45166015625, 2.531585693359375, 2.61151123046875, 2.691436767578125, 2.7713623046875, 2.851287841796875, 2.93121337890625, 3.011138916015625, 3.091064453125, 3.170989990234375, 3.25091552734375, 3.330841064453125, 3.4107666015625, 3.490692138671875, 3.57061767578125, 3.650543212890625, 3.73046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 12.0, 21.0, 47.0, 157.0, 274.0, 253.0, 155.0, 57.0, 18.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.04229736328125, -25.812040328979492, -24.581783294677734, -23.351524353027344, -22.121267318725586, -20.891010284423828, -19.660751342773438, -18.43049430847168, -17.200237274169922, -15.969980239868164, -14.73972225189209, -13.509464263916016, -12.279207229614258, -11.0489501953125, -9.818692207336426, -8.588434219360352, -7.358177185058594, -6.127919673919678, -4.897662162780762, -3.6674046516418457, -2.4371471405029297, -1.2068896293640137, 0.023367881774902344, 1.2536258697509766, 2.4838829040527344, 3.7141404151916504, 4.944397926330566, 6.174655437469482, 7.404912948608398, 8.635169982910156, 9.86542797088623, 11.095685958862305, 12.325946807861328, 13.556203842163086, 14.78646183013916, 16.016719818115234, 17.246976852416992, 18.47723388671875, 19.70749282836914, 20.9377498626709, 22.168006896972656, 23.398263931274414, 24.628520965576172, 25.858779907226562, 27.08903694152832, 28.319293975830078, 29.54955291748047, 30.779809951782227, 32.010066986083984, 33.240325927734375, 34.4705810546875, 35.70083999633789, 36.93109893798828, 38.161354064941406, 39.3916130065918, 40.62187194824219, 41.85212707519531, 43.0823860168457, 44.31264114379883, 45.54290008544922, 46.773155212402344, 48.003414154052734, 49.233673095703125, 50.46392822265625, 51.69418716430664]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 7.0, 8.0, 4.0, 6.0, 14.0, 8.0, 20.0, 15.0, 22.0, 21.0, 36.0, 20.0, 38.0, 39.0, 40.0, 33.0, 37.0, 36.0, 41.0, 42.0, 44.0, 41.0, 46.0, 29.0, 33.0, 26.0, 35.0, 25.0, 26.0, 33.0, 30.0, 25.0, 16.0, 12.0, 16.0, 19.0, 15.0, 9.0, 5.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.662406921386719, -13.273585319519043, -12.88476276397705, -12.495941162109375, -12.1071195602417, -11.718297958374023, -11.329475402832031, -10.940653800964355, -10.55183219909668, -10.163010597229004, -9.774188041687012, -9.385366439819336, -8.99654483795166, -8.607723236083984, -8.218900680541992, -7.830079078674316, -7.441256523132324, -7.05243444442749, -6.6636128425598145, -6.2747907638549805, -5.885969161987305, -5.497147083282471, -5.108325004577637, -4.719503402709961, -4.330681324005127, -3.941859483718872, -3.553037643432617, -3.164215564727783, -2.7753937244415283, -2.3865718841552734, -1.9977498054504395, -1.6089279651641846, -1.2201061248779297, -0.83128422498703, -0.44246232509613037, -0.05364036560058594, 0.33518147468566895, 0.7240033149719238, 1.1128253936767578, 1.5016472339630127, 1.8904690742492676, 2.2792909145355225, 2.6681127548217773, 3.0569348335266113, 3.445756673812866, 3.834578514099121, 4.223400592803955, 4.612222671508789, 5.001044273376465, 5.389866352081299, 5.778687953948975, 6.167510032653809, 6.556331634521484, 6.945153713226318, 7.333975791931152, 7.722797393798828, 8.11161994934082, 8.500441551208496, 8.889264106750488, 9.278085708618164, 9.66690731048584, 10.055728912353516, 10.444551467895508, 10.833373069763184, 11.22219467163086]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 6.0, 8.0, 12.0, 18.0, 26.0, 33.0, 49.0, 104.0, 126.0, 194.0, 447.0, 1062.0, 2758.0, 11342.0, 132594.0, 3977784.0, 57063.0, 7170.0, 2016.0, 727.0, 324.0, 176.0, 90.0, 53.0, 32.0, 18.0, 17.0, 6.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.8671875, -9.62274169921875, -9.3782958984375, -9.13385009765625, -8.889404296875, -8.64495849609375, -8.4005126953125, -8.15606689453125, -7.91162109375, -7.66717529296875, -7.4227294921875, -7.17828369140625, -6.933837890625, -6.68939208984375, -6.4449462890625, -6.20050048828125, -5.9560546875, -5.71160888671875, -5.4671630859375, -5.22271728515625, -4.978271484375, -4.73382568359375, -4.4893798828125, -4.24493408203125, -4.00048828125, -3.75604248046875, -3.5115966796875, -3.26715087890625, -3.022705078125, -2.77825927734375, -2.5338134765625, -2.28936767578125, -2.044921875, -1.80047607421875, -1.5560302734375, -1.31158447265625, -1.067138671875, -0.82269287109375, -0.5782470703125, -0.33380126953125, -0.08935546875, 0.15509033203125, 0.3995361328125, 0.64398193359375, 0.888427734375, 1.13287353515625, 1.3773193359375, 1.62176513671875, 1.8662109375, 2.11065673828125, 2.3551025390625, 2.59954833984375, 2.843994140625, 3.08843994140625, 3.3328857421875, 3.57733154296875, 3.82177734375, 4.06622314453125, 4.3106689453125, 4.55511474609375, 4.799560546875, 5.04400634765625, 5.2884521484375, 5.53289794921875, 5.77734375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 18.0, 21.0, 37.0, 43.0, 47.0, 66.0, 75.0, 99.0, 69.0, 110.0, 98.0, 77.0, 65.0, 51.0, 43.0, 22.0, 11.0, 14.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7119140625, -1.671844482421875, -1.63177490234375, -1.591705322265625, -1.5516357421875, -1.511566162109375, -1.47149658203125, -1.431427001953125, -1.391357421875, -1.351287841796875, -1.31121826171875, -1.271148681640625, -1.2310791015625, -1.191009521484375, -1.15093994140625, -1.110870361328125, -1.07080078125, -1.030731201171875, -0.99066162109375, -0.950592041015625, -0.9105224609375, -0.870452880859375, -0.83038330078125, -0.790313720703125, -0.750244140625, -0.710174560546875, -0.67010498046875, -0.630035400390625, -0.5899658203125, -0.549896240234375, -0.50982666015625, -0.469757080078125, -0.4296875, -0.389617919921875, -0.34954833984375, -0.309478759765625, -0.2694091796875, -0.229339599609375, -0.18927001953125, -0.149200439453125, -0.109130859375, -0.069061279296875, -0.02899169921875, 0.011077880859375, 0.0511474609375, 0.091217041015625, 0.13128662109375, 0.171356201171875, 0.21142578125, 0.251495361328125, 0.29156494140625, 0.331634521484375, 0.3717041015625, 0.411773681640625, 0.45184326171875, 0.491912841796875, 0.531982421875, 0.572052001953125, 0.61212158203125, 0.652191162109375, 0.6922607421875, 0.732330322265625, 0.77239990234375, 0.812469482421875, 0.8525390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 20.0, 26.0, 31.0, 39.0, 79.0, 142.0, 259.0, 546.0, 1655.0, 6683.0, 45476.0, 3299172.0, 803336.0, 29295.0, 5169.0, 1403.0, 474.0, 199.0, 99.0, 62.0, 39.0, 31.0, 17.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.5374755859375, -5.352294921875, -5.1671142578125, -4.98193359375, -4.7967529296875, -4.611572265625, -4.4263916015625, -4.2412109375, -4.0560302734375, -3.870849609375, -3.6856689453125, -3.50048828125, -3.3153076171875, -3.130126953125, -2.9449462890625, -2.759765625, -2.5745849609375, -2.389404296875, -2.2042236328125, -2.01904296875, -1.8338623046875, -1.648681640625, -1.4635009765625, -1.2783203125, -1.0931396484375, -0.907958984375, -0.7227783203125, -0.53759765625, -0.3524169921875, -0.167236328125, 0.0179443359375, 0.203125, 0.3883056640625, 0.573486328125, 0.7586669921875, 0.94384765625, 1.1290283203125, 1.314208984375, 1.4993896484375, 1.6845703125, 1.8697509765625, 2.054931640625, 2.2401123046875, 2.42529296875, 2.6104736328125, 2.795654296875, 2.9808349609375, 3.166015625, 3.3511962890625, 3.536376953125, 3.7215576171875, 3.90673828125, 4.0919189453125, 4.277099609375, 4.4622802734375, 4.6474609375, 4.8326416015625, 5.017822265625, 5.2030029296875, 5.38818359375, 5.5733642578125, 5.758544921875, 5.9437255859375, 6.12890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 12.0, 11.0, 20.0, 16.0, 27.0, 47.0, 73.0, 121.0, 242.0, 730.0, 1768.0, 494.0, 213.0, 116.0, 55.0, 34.0, 19.0, 12.0, 10.0, 11.0, 12.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.794921875, -1.7426605224609375, -1.690399169921875, -1.6381378173828125, -1.58587646484375, -1.5336151123046875, -1.481353759765625, -1.4290924072265625, -1.3768310546875, -1.3245697021484375, -1.272308349609375, -1.2200469970703125, -1.16778564453125, -1.1155242919921875, -1.063262939453125, -1.0110015869140625, -0.958740234375, -0.9064788818359375, -0.854217529296875, -0.8019561767578125, -0.74969482421875, -0.6974334716796875, -0.645172119140625, -0.5929107666015625, -0.5406494140625, -0.4883880615234375, -0.436126708984375, -0.3838653564453125, -0.33160400390625, -0.2793426513671875, -0.227081298828125, -0.1748199462890625, -0.12255859375, -0.0702972412109375, -0.018035888671875, 0.0342254638671875, 0.08648681640625, 0.1387481689453125, 0.191009521484375, 0.2432708740234375, 0.2955322265625, 0.3477935791015625, 0.400054931640625, 0.4523162841796875, 0.50457763671875, 0.5568389892578125, 0.609100341796875, 0.6613616943359375, 0.713623046875, 0.7658843994140625, 0.818145751953125, 0.8704071044921875, 0.92266845703125, 0.9749298095703125, 1.027191162109375, 1.0794525146484375, 1.1317138671875, 1.1839752197265625, 1.236236572265625, 1.2884979248046875, 1.34075927734375, 1.3930206298828125, 1.445281982421875, 1.4975433349609375, 1.5498046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 4.0, 9.0, 28.0, 83.0, 150.0, 275.0, 227.0, 126.0, 48.0, 26.0, 17.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.287155151367188, -18.804149627685547, -18.321142196655273, -17.838134765625, -17.35512924194336, -16.87212371826172, -16.389116287231445, -15.906109809875488, -15.423103332519531, -14.940096855163574, -14.457090377807617, -13.97408390045166, -13.491077423095703, -13.008070945739746, -12.525064468383789, -12.042057991027832, -11.559051513671875, -11.076045036315918, -10.593038558959961, -10.110032081604004, -9.627025604248047, -9.14401912689209, -8.661012649536133, -8.178006172180176, -7.694999694824219, -7.211993217468262, -6.728986740112305, -6.245980262756348, -5.762973785400391, -5.279967308044434, -4.796960830688477, -4.3139543533325195, -3.830946922302246, -3.347940444946289, -2.864933967590332, -2.381927490234375, -1.898921012878418, -1.415914535522461, -0.9329080581665039, -0.4499015808105469, 0.033104896545410156, 0.5161113739013672, 0.9991178512573242, 1.4821243286132812, 1.9651308059692383, 2.4481372833251953, 2.9311437606811523, 3.4141502380371094, 3.8971567153930664, 4.380163192749023, 4.8631696701049805, 5.3461761474609375, 5.8291826248168945, 6.312189102172852, 6.795195579528809, 7.278202056884766, 7.761208534240723, 8.24421501159668, 8.727221488952637, 9.210227966308594, 9.69323444366455, 10.176240921020508, 10.659247398376465, 11.142253875732422, 11.625260353088379]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 10.0, 9.0, 9.0, 14.0, 8.0, 29.0, 29.0, 25.0, 34.0, 39.0, 33.0, 35.0, 61.0, 42.0, 37.0, 54.0, 40.0, 36.0, 54.0, 44.0, 59.0, 41.0, 31.0, 30.0, 40.0, 34.0, 21.0, 23.0, 13.0, 10.0, 6.0, 10.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.219407081604004, -5.058233261108398, -4.897059440612793, -4.735886096954346, -4.57471227645874, -4.413538455963135, -4.2523651123046875, -4.091191291809082, -3.9300174713134766, -3.768843650817871, -3.6076700687408447, -3.4464964866638184, -3.285322666168213, -3.1241488456726074, -2.962975263595581, -2.8018016815185547, -2.640627861022949, -2.4794540405273438, -2.3182804584503174, -2.157106876373291, -1.9959330558776855, -1.8347593545913696, -1.6735856533050537, -1.5124119520187378, -1.3512382507324219, -1.190064549446106, -1.02889084815979, -0.8677171468734741, -0.7065434455871582, -0.5453697443008423, -0.38419604301452637, -0.22302234172821045, -0.061849117279052734, 0.09932458400726318, 0.2604982852935791, 0.421671986579895, 0.5828456878662109, 0.7440193891525269, 0.9051930904388428, 1.0663667917251587, 1.2275404930114746, 1.3887141942977905, 1.5498878955841064, 1.7110615968704224, 1.8722352981567383, 2.0334091186523438, 2.19458270072937, 2.3557562828063965, 2.516930103302002, 2.6781039237976074, 2.839277505874634, 3.00045108795166, 3.1616249084472656, 3.322798728942871, 3.4839723110198975, 3.645145893096924, 3.8063197135925293, 3.9674935340881348, 4.128666877746582, 4.2898406982421875, 4.451014518737793, 4.612188339233398, 4.773362159729004, 4.934535503387451, 5.095709323883057]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 16.0, 15.0, 35.0, 42.0, 69.0, 129.0, 252.0, 615.0, 1739.0, 6324.0, 39882.0, 604331.0, 360631.0, 27096.0, 4881.0, 1392.0, 555.0, 226.0, 127.0, 62.0, 35.0, 20.0, 21.0, 15.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.26953125, -6.07305908203125, -5.8765869140625, -5.68011474609375, -5.483642578125, -5.28717041015625, -5.0906982421875, -4.89422607421875, -4.69775390625, -4.50128173828125, -4.3048095703125, -4.10833740234375, -3.911865234375, -3.71539306640625, -3.5189208984375, -3.32244873046875, -3.1259765625, -2.92950439453125, -2.7330322265625, -2.53656005859375, -2.340087890625, -2.14361572265625, -1.9471435546875, -1.75067138671875, -1.55419921875, -1.35772705078125, -1.1612548828125, -0.96478271484375, -0.768310546875, -0.57183837890625, -0.3753662109375, -0.17889404296875, 0.017578125, 0.21405029296875, 0.4105224609375, 0.60699462890625, 0.803466796875, 0.99993896484375, 1.1964111328125, 1.39288330078125, 1.58935546875, 1.78582763671875, 1.9822998046875, 2.17877197265625, 2.375244140625, 2.57171630859375, 2.7681884765625, 2.96466064453125, 3.1611328125, 3.35760498046875, 3.5540771484375, 3.75054931640625, 3.947021484375, 4.14349365234375, 4.3399658203125, 4.53643798828125, 4.73291015625, 4.92938232421875, 5.1258544921875, 5.32232666015625, 5.518798828125, 5.71527099609375, 5.9117431640625, 6.10821533203125, 6.3046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 7.0, 21.0, 23.0, 22.0, 39.0, 63.0, 76.0, 94.0, 90.0, 94.0, 91.0, 79.0, 75.0, 75.0, 59.0, 23.0, 26.0, 14.0, 11.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.796875, -1.7546463012695312, -1.7124176025390625, -1.6701889038085938, -1.627960205078125, -1.5857315063476562, -1.5435028076171875, -1.5012741088867188, -1.45904541015625, -1.4168167114257812, -1.3745880126953125, -1.3323593139648438, -1.290130615234375, -1.2479019165039062, -1.2056732177734375, -1.1634445190429688, -1.1212158203125, -1.0789871215820312, -1.0367584228515625, -0.9945297241210938, -0.952301025390625, -0.9100723266601562, -0.8678436279296875, -0.8256149291992188, -0.78338623046875, -0.7411575317382812, -0.6989288330078125, -0.6567001342773438, -0.614471435546875, -0.5722427368164062, -0.5300140380859375, -0.48778533935546875, -0.445556640625, -0.40332794189453125, -0.3610992431640625, -0.31887054443359375, -0.276641845703125, -0.23441314697265625, -0.1921844482421875, -0.14995574951171875, -0.10772705078125, -0.06549835205078125, -0.0232696533203125, 0.01895904541015625, 0.061187744140625, 0.10341644287109375, 0.1456451416015625, 0.18787384033203125, 0.2301025390625, 0.27233123779296875, 0.3145599365234375, 0.35678863525390625, 0.399017333984375, 0.44124603271484375, 0.4834747314453125, 0.5257034301757812, 0.56793212890625, 0.6101608276367188, 0.6523895263671875, 0.6946182250976562, 0.736846923828125, 0.7790756225585938, 0.8213043212890625, 0.8635330200195312, 0.90576171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 8.0, 17.0, 28.0, 26.0, 35.0, 54.0, 85.0, 99.0, 193.0, 339.0, 781.0, 2118.0, 7405.0, 35451.0, 272763.0, 624784.0, 83813.0, 14298.0, 3692.0, 1285.0, 543.0, 267.0, 146.0, 78.0, 54.0, 38.0, 36.0, 23.0, 18.0, 15.0, 6.0, 7.0, 7.0, 3.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.359375, -3.2403564453125, -3.121337890625, -3.0023193359375, -2.88330078125, -2.7642822265625, -2.645263671875, -2.5262451171875, -2.4072265625, -2.2882080078125, -2.169189453125, -2.0501708984375, -1.93115234375, -1.8121337890625, -1.693115234375, -1.5740966796875, -1.455078125, -1.3360595703125, -1.217041015625, -1.0980224609375, -0.97900390625, -0.8599853515625, -0.740966796875, -0.6219482421875, -0.5029296875, -0.3839111328125, -0.264892578125, -0.1458740234375, -0.02685546875, 0.0921630859375, 0.211181640625, 0.3302001953125, 0.44921875, 0.5682373046875, 0.687255859375, 0.8062744140625, 0.92529296875, 1.0443115234375, 1.163330078125, 1.2823486328125, 1.4013671875, 1.5203857421875, 1.639404296875, 1.7584228515625, 1.87744140625, 1.9964599609375, 2.115478515625, 2.2344970703125, 2.353515625, 2.4725341796875, 2.591552734375, 2.7105712890625, 2.82958984375, 2.9486083984375, 3.067626953125, 3.1866455078125, 3.3056640625, 3.4246826171875, 3.543701171875, 3.6627197265625, 3.78173828125, 3.9007568359375, 4.019775390625, 4.1387939453125, 4.2578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 9.0, 9.0, 5.0, 10.0, 31.0, 19.0, 24.0, 29.0, 30.0, 32.0, 36.0, 33.0, 33.0, 56.0, 38.0, 41.0, 52.0, 36.0, 56.0, 44.0, 47.0, 45.0, 47.0, 39.0, 36.0, 37.0, 16.0, 16.0, 16.0, 18.0, 12.0, 13.0, 10.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.517578125, -2.42388916015625, -2.3302001953125, -2.23651123046875, -2.142822265625, -2.04913330078125, -1.9554443359375, -1.86175537109375, -1.76806640625, -1.67437744140625, -1.5806884765625, -1.48699951171875, -1.393310546875, -1.29962158203125, -1.2059326171875, -1.11224365234375, -1.0185546875, -0.92486572265625, -0.8311767578125, -0.73748779296875, -0.643798828125, -0.55010986328125, -0.4564208984375, -0.36273193359375, -0.26904296875, -0.17535400390625, -0.0816650390625, 0.01202392578125, 0.105712890625, 0.19940185546875, 0.2930908203125, 0.38677978515625, 0.48046875, 0.57415771484375, 0.6678466796875, 0.76153564453125, 0.855224609375, 0.94891357421875, 1.0426025390625, 1.13629150390625, 1.22998046875, 1.32366943359375, 1.4173583984375, 1.51104736328125, 1.604736328125, 1.69842529296875, 1.7921142578125, 1.88580322265625, 1.9794921875, 2.07318115234375, 2.1668701171875, 2.26055908203125, 2.354248046875, 2.44793701171875, 2.5416259765625, 2.63531494140625, 2.72900390625, 2.82269287109375, 2.9163818359375, 3.01007080078125, 3.103759765625, 3.19744873046875, 3.2911376953125, 3.38482666015625, 3.478515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 7.0, 13.0, 17.0, 24.0, 52.0, 112.0, 232.0, 685.0, 2036.0, 8225.0, 67299.0, 871434.0, 85538.0, 9240.0, 2369.0, 723.0, 262.0, 116.0, 51.0, 23.0, 23.0, 18.0, 6.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.028533935546875, -1.95745849609375, -1.886383056640625, -1.8153076171875, -1.744232177734375, -1.67315673828125, -1.602081298828125, -1.531005859375, -1.459930419921875, -1.38885498046875, -1.317779541015625, -1.2467041015625, -1.175628662109375, -1.10455322265625, -1.033477783203125, -0.96240234375, -0.891326904296875, -0.82025146484375, -0.749176025390625, -0.6781005859375, -0.607025146484375, -0.53594970703125, -0.464874267578125, -0.393798828125, -0.322723388671875, -0.25164794921875, -0.180572509765625, -0.1094970703125, -0.038421630859375, 0.03265380859375, 0.103729248046875, 0.1748046875, 0.245880126953125, 0.31695556640625, 0.388031005859375, 0.4591064453125, 0.530181884765625, 0.60125732421875, 0.672332763671875, 0.743408203125, 0.814483642578125, 0.88555908203125, 0.956634521484375, 1.0277099609375, 1.098785400390625, 1.16986083984375, 1.240936279296875, 1.31201171875, 1.383087158203125, 1.45416259765625, 1.525238037109375, 1.5963134765625, 1.667388916015625, 1.73846435546875, 1.809539794921875, 1.880615234375, 1.951690673828125, 2.02276611328125, 2.093841552734375, 2.1649169921875, 2.235992431640625, 2.30706787109375, 2.378143310546875, 2.44921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 10.0, 14.0, 28.0, 29.0, 54.0, 98.0, 181.0, 207.0, 141.0, 80.0, 54.0, 28.0, 17.0, 10.0, 15.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002503395080566406, -0.00023960694670677185, -0.00022887438535690308, -0.0002181418240070343, -0.00020740926265716553, -0.00019667670130729675, -0.00018594413995742798, -0.0001752115786075592, -0.00016447901725769043, -0.00015374645590782166, -0.00014301389455795288, -0.0001322813332080841, -0.00012154877185821533, -0.00011081621050834656, -0.00010008364915847778, -8.935108780860901e-05, -7.861852645874023e-05, -6.788596510887146e-05, -5.7153403759002686e-05, -4.642084240913391e-05, -3.568828105926514e-05, -2.4955719709396362e-05, -1.4223158359527588e-05, -3.4905970096588135e-06, 7.241964340209961e-06, 1.7974525690078735e-05, 2.870708703994751e-05, 3.9439648389816284e-05, 5.017220973968506e-05, 6.090477108955383e-05, 7.163733243942261e-05, 8.236989378929138e-05, 9.310245513916016e-05, 0.00010383501648902893, 0.0001145675778388977, 0.00012530013918876648, 0.00013603270053863525, 0.00014676526188850403, 0.0001574978232383728, 0.00016823038458824158, 0.00017896294593811035, 0.00018969550728797913, 0.0002004280686378479, 0.00021116062998771667, 0.00022189319133758545, 0.00023262575268745422, 0.000243358314037323, 0.00025409087538719177, 0.00026482343673706055, 0.0002755559980869293, 0.0002862885594367981, 0.00029702112078666687, 0.00030775368213653564, 0.0003184862434864044, 0.0003292188048362732, 0.00033995136618614197, 0.00035068392753601074, 0.0003614164888858795, 0.0003721490502357483, 0.00038288161158561707, 0.00039361417293548584, 0.0004043467342853546, 0.0004150792956352234, 0.00042581185698509216, 0.00043654441833496094]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 1.0, 10.0, 17.0, 14.0, 28.0, 53.0, 91.0, 120.0, 278.0, 612.0, 1851.0, 9024.0, 81355.0, 867634.0, 76208.0, 8227.0, 1759.0, 630.0, 258.0, 137.0, 73.0, 61.0, 36.0, 23.0, 14.0, 14.0, 8.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8534698486328125, -1.786041259765625, -1.7186126708984375, -1.65118408203125, -1.5837554931640625, -1.516326904296875, -1.4488983154296875, -1.3814697265625, -1.3140411376953125, -1.246612548828125, -1.1791839599609375, -1.11175537109375, -1.0443267822265625, -0.976898193359375, -0.9094696044921875, -0.842041015625, -0.7746124267578125, -0.707183837890625, -0.6397552490234375, -0.57232666015625, -0.5048980712890625, -0.437469482421875, -0.3700408935546875, -0.3026123046875, -0.2351837158203125, -0.167755126953125, -0.1003265380859375, -0.03289794921875, 0.0345306396484375, 0.101959228515625, 0.1693878173828125, 0.23681640625, 0.3042449951171875, 0.371673583984375, 0.4391021728515625, 0.50653076171875, 0.5739593505859375, 0.641387939453125, 0.7088165283203125, 0.7762451171875, 0.8436737060546875, 0.911102294921875, 0.9785308837890625, 1.04595947265625, 1.1133880615234375, 1.180816650390625, 1.2482452392578125, 1.315673828125, 1.3831024169921875, 1.450531005859375, 1.5179595947265625, 1.58538818359375, 1.6528167724609375, 1.720245361328125, 1.7876739501953125, 1.8551025390625, 1.9225311279296875, 1.989959716796875, 2.0573883056640625, 2.12481689453125, 2.1922454833984375, 2.259674072265625, 2.3271026611328125, 2.39453125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 3.0, 8.0, 13.0, 20.0, 24.0, 26.0, 29.0, 44.0, 75.0, 116.0, 129.0, 126.0, 111.0, 79.0, 51.0, 27.0, 30.0, 22.0, 15.0, 10.0, 5.0, 3.0, 12.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.49609375, -1.4611434936523438, -1.4261932373046875, -1.3912429809570312, -1.356292724609375, -1.3213424682617188, -1.2863922119140625, -1.2514419555664062, -1.21649169921875, -1.1815414428710938, -1.1465911865234375, -1.1116409301757812, -1.076690673828125, -1.0417404174804688, -1.0067901611328125, -0.9718399047851562, -0.9368896484375, -0.9019393920898438, -0.8669891357421875, -0.8320388793945312, -0.797088623046875, -0.7621383666992188, -0.7271881103515625, -0.6922378540039062, -0.65728759765625, -0.6223373413085938, -0.5873870849609375, -0.5524368286132812, -0.517486572265625, -0.48253631591796875, -0.4475860595703125, -0.41263580322265625, -0.377685546875, -0.34273529052734375, -0.3077850341796875, -0.27283477783203125, -0.237884521484375, -0.20293426513671875, -0.1679840087890625, -0.13303375244140625, -0.09808349609375, -0.06313323974609375, -0.0281829833984375, 0.00676727294921875, 0.041717529296875, 0.07666778564453125, 0.1116180419921875, 0.14656829833984375, 0.1815185546875, 0.21646881103515625, 0.2514190673828125, 0.28636932373046875, 0.321319580078125, 0.35626983642578125, 0.3912200927734375, 0.42617034912109375, 0.46112060546875, 0.49607086181640625, 0.5310211181640625, 0.5659713745117188, 0.600921630859375, 0.6358718872070312, 0.6708221435546875, 0.7057723999023438, 0.74072265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 29.0, 64.0, 175.0, 275.0, 224.0, 129.0, 65.0, 19.0, 10.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.359935760498047, -23.333763122558594, -22.30759048461914, -21.281415939331055, -20.2552433013916, -19.22907066345215, -18.202896118164062, -17.17672348022461, -16.150550842285156, -15.124378204345703, -14.098204612731934, -13.072031021118164, -12.045858383178711, -11.019685745239258, -9.993512153625488, -8.967338562011719, -7.941165924072266, -6.914992809295654, -5.888819694519043, -4.862646579742432, -3.8364734649658203, -2.810300350189209, -1.7841272354125977, -0.7579541206359863, 0.268218994140625, 1.2943921089172363, 2.3205652236938477, 3.346738338470459, 4.37291145324707, 5.399084568023682, 6.425257682800293, 7.451430797576904, 8.477607727050781, 9.503780364990234, 10.529953956604004, 11.556127548217773, 12.582300186157227, 13.60847282409668, 14.63464641571045, 15.660820007324219, 16.686992645263672, 17.713165283203125, 18.739337921142578, 19.765512466430664, 20.791685104370117, 21.81785774230957, 22.844032287597656, 23.87020492553711, 24.896377563476562, 25.922550201416016, 26.94872283935547, 27.974897384643555, 29.001070022583008, 30.02724266052246, 31.053417205810547, 32.07958984375, 33.10576248168945, 34.131935119628906, 35.15810775756836, 36.18428039550781, 37.21045684814453, 38.236629486083984, 39.26280212402344, 40.28897476196289, 41.315147399902344]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 7.0, 11.0, 14.0, 14.0, 17.0, 22.0, 21.0, 16.0, 17.0, 16.0, 28.0, 27.0, 32.0, 27.0, 47.0, 37.0, 52.0, 38.0, 36.0, 36.0, 38.0, 47.0, 37.0, 36.0, 31.0, 25.0, 30.0, 30.0, 34.0, 22.0, 19.0, 18.0, 15.0, 13.0, 13.0, 14.0, 10.0, 6.0, 5.0, 3.0, 1.0, 3.0, 6.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-12.554769515991211, -12.159811019897461, -11.764853477478027, -11.369894981384277, -10.974937438964844, -10.579978942871094, -10.18502140045166, -9.79006290435791, -9.395105361938477, -9.000146865844727, -8.605189323425293, -8.210230827331543, -7.815273284912109, -7.420315265655518, -7.025357246398926, -6.630398750305176, -6.235440731048584, -5.840482711791992, -5.4455246925354, -5.050566673278809, -4.655608654022217, -4.260650634765625, -3.865692377090454, -3.4707343578338623, -3.0757763385772705, -2.6808183193206787, -2.285860300064087, -1.8909021615982056, -1.4959441423416138, -1.100986123085022, -0.7060279846191406, -0.31106996536254883, 0.08388805389404297, 0.47884610295295715, 0.8738041520118713, 1.268762230873108, 1.6637202501296997, 2.058678150177002, 2.453636407852173, 2.8485944271087646, 3.2435524463653564, 3.6385104656219482, 4.033468723297119, 4.428426742553711, 4.823384761810303, 5.2183427810668945, 5.613300800323486, 6.008258819580078, 6.40321683883667, 6.798174858093262, 7.1931328773498535, 7.588090896606445, 7.983048915863037, 8.378006935119629, 8.772965431213379, 9.167922973632812, 9.562881469726562, 9.957839965820312, 10.352797508239746, 10.747756004333496, 11.14271354675293, 11.53767204284668, 11.932629585266113, 12.327588081359863, 12.722545623779297]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 4.0, 9.0, 14.0, 8.0, 20.0, 21.0, 29.0, 36.0, 54.0, 117.0, 165.0, 343.0, 687.0, 1796.0, 5623.0, 27338.0, 1009159.0, 3108117.0, 31400.0, 6080.0, 1867.0, 712.0, 293.0, 161.0, 97.0, 49.0, 27.0, 18.0, 13.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.82421875, -6.644775390625, -6.46533203125, -6.285888671875, -6.1064453125, -5.927001953125, -5.74755859375, -5.568115234375, -5.388671875, -5.209228515625, -5.02978515625, -4.850341796875, -4.6708984375, -4.491455078125, -4.31201171875, -4.132568359375, -3.953125, -3.773681640625, -3.59423828125, -3.414794921875, -3.2353515625, -3.055908203125, -2.87646484375, -2.697021484375, -2.517578125, -2.338134765625, -2.15869140625, -1.979248046875, -1.7998046875, -1.620361328125, -1.44091796875, -1.261474609375, -1.08203125, -0.902587890625, -0.72314453125, -0.543701171875, -0.3642578125, -0.184814453125, -0.00537109375, 0.174072265625, 0.353515625, 0.532958984375, 0.71240234375, 0.891845703125, 1.0712890625, 1.250732421875, 1.43017578125, 1.609619140625, 1.7890625, 1.968505859375, 2.14794921875, 2.327392578125, 2.5068359375, 2.686279296875, 2.86572265625, 3.045166015625, 3.224609375, 3.404052734375, 3.58349609375, 3.762939453125, 3.9423828125, 4.121826171875, 4.30126953125, 4.480712890625, 4.66015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 9.0, 5.0, 9.0, 18.0, 17.0, 26.0, 38.0, 55.0, 61.0, 76.0, 80.0, 76.0, 81.0, 82.0, 69.0, 76.0, 64.0, 48.0, 43.0, 32.0, 13.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8076171875, -1.7658462524414062, -1.7240753173828125, -1.6823043823242188, -1.640533447265625, -1.5987625122070312, -1.5569915771484375, -1.5152206420898438, -1.47344970703125, -1.4316787719726562, -1.3899078369140625, -1.3481369018554688, -1.306365966796875, -1.2645950317382812, -1.2228240966796875, -1.1810531616210938, -1.1392822265625, -1.0975112915039062, -1.0557403564453125, -1.0139694213867188, -0.972198486328125, -0.9304275512695312, -0.8886566162109375, -0.8468856811523438, -0.80511474609375, -0.7633438110351562, -0.7215728759765625, -0.6798019409179688, -0.638031005859375, -0.5962600708007812, -0.5544891357421875, -0.5127182006835938, -0.470947265625, -0.42917633056640625, -0.3874053955078125, -0.34563446044921875, -0.303863525390625, -0.26209259033203125, -0.2203216552734375, -0.17855072021484375, -0.13677978515625, -0.09500885009765625, -0.0532379150390625, -0.01146697998046875, 0.030303955078125, 0.07207489013671875, 0.1138458251953125, 0.15561676025390625, 0.1973876953125, 0.23915863037109375, 0.2809295654296875, 0.32270050048828125, 0.364471435546875, 0.40624237060546875, 0.4480133056640625, 0.48978424072265625, 0.53155517578125, 0.5733261108398438, 0.6150970458984375, 0.6568679809570312, 0.698638916015625, 0.7404098510742188, 0.7821807861328125, 0.8239517211914062, 0.86572265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 17.0, 30.0, 49.0, 55.0, 106.0, 148.0, 287.0, 539.0, 1374.0, 4325.0, 25901.0, 3239776.0, 894705.0, 20795.0, 3918.0, 1203.0, 503.0, 234.0, 127.0, 66.0, 45.0, 34.0, 15.0, 6.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.1875, -8.97845458984375, -8.7694091796875, -8.56036376953125, -8.351318359375, -8.14227294921875, -7.9332275390625, -7.72418212890625, -7.51513671875, -7.30609130859375, -7.0970458984375, -6.88800048828125, -6.678955078125, -6.46990966796875, -6.2608642578125, -6.05181884765625, -5.8427734375, -5.63372802734375, -5.4246826171875, -5.21563720703125, -5.006591796875, -4.79754638671875, -4.5885009765625, -4.37945556640625, -4.17041015625, -3.96136474609375, -3.7523193359375, -3.54327392578125, -3.334228515625, -3.12518310546875, -2.9161376953125, -2.70709228515625, -2.498046875, -2.28900146484375, -2.0799560546875, -1.87091064453125, -1.661865234375, -1.45281982421875, -1.2437744140625, -1.03472900390625, -0.82568359375, -0.61663818359375, -0.4075927734375, -0.19854736328125, 0.010498046875, 0.21954345703125, 0.4285888671875, 0.63763427734375, 0.8466796875, 1.05572509765625, 1.2647705078125, 1.47381591796875, 1.682861328125, 1.89190673828125, 2.1009521484375, 2.30999755859375, 2.51904296875, 2.72808837890625, 2.9371337890625, 3.14617919921875, 3.355224609375, 3.56427001953125, 3.7733154296875, 3.98236083984375, 4.19140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 7.0, 11.0, 22.0, 21.0, 48.0, 132.0, 482.0, 2773.0, 373.0, 100.0, 43.0, 24.0, 14.0, 11.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.513671875, -3.432830810546875, -3.35198974609375, -3.271148681640625, -3.1903076171875, -3.109466552734375, -3.02862548828125, -2.947784423828125, -2.866943359375, -2.786102294921875, -2.70526123046875, -2.624420166015625, -2.5435791015625, -2.462738037109375, -2.38189697265625, -2.301055908203125, -2.22021484375, -2.139373779296875, -2.05853271484375, -1.977691650390625, -1.8968505859375, -1.816009521484375, -1.73516845703125, -1.654327392578125, -1.573486328125, -1.492645263671875, -1.41180419921875, -1.330963134765625, -1.2501220703125, -1.169281005859375, -1.08843994140625, -1.007598876953125, -0.9267578125, -0.845916748046875, -0.76507568359375, -0.684234619140625, -0.6033935546875, -0.522552490234375, -0.44171142578125, -0.360870361328125, -0.280029296875, -0.199188232421875, -0.11834716796875, -0.037506103515625, 0.0433349609375, 0.124176025390625, 0.20501708984375, 0.285858154296875, 0.36669921875, 0.447540283203125, 0.52838134765625, 0.609222412109375, 0.6900634765625, 0.770904541015625, 0.85174560546875, 0.932586669921875, 1.013427734375, 1.094268798828125, 1.17510986328125, 1.255950927734375, 1.3367919921875, 1.417633056640625, 1.49847412109375, 1.579315185546875, 1.66015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 9.0, 15.0, 46.0, 129.0, 277.0, 292.0, 139.0, 63.0, 19.0, 6.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.064916610717773, -25.56854820251465, -25.072181701660156, -24.57581329345703, -24.079444885253906, -23.583078384399414, -23.08670997619629, -22.590341567993164, -22.093975067138672, -21.597606658935547, -21.101240158081055, -20.60487174987793, -20.108503341674805, -19.612136840820312, -19.115768432617188, -18.619400024414062, -18.123031616210938, -17.626663208007812, -17.13029670715332, -16.633928298950195, -16.13755989074707, -15.641193389892578, -15.144824981689453, -14.648457527160645, -14.152090072631836, -13.655722618103027, -13.159354209899902, -12.662986755371094, -12.166619300842285, -11.670251846313477, -11.173883438110352, -10.677515983581543, -10.181148529052734, -9.684781074523926, -9.1884126663208, -8.692045211791992, -8.195677757263184, -7.699309825897217, -7.20294189453125, -6.706574440002441, -6.210206031799316, -5.71383810043335, -5.217470645904541, -4.721102714538574, -4.224735260009766, -3.728367328643799, -3.231999397277832, -2.7356317043304443, -2.2392640113830566, -1.742896318435669, -1.2465285062789917, -0.7501606941223145, -0.25379300117492676, 0.24257469177246094, 0.7389426231384277, 1.2353103160858154, 1.7316780090332031, 2.228045701980591, 2.7244133949279785, 3.2207813262939453, 3.717149019241333, 4.213516712188721, 4.7098846435546875, 5.206252098083496, 5.702620029449463]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 19.0, 19.0, 34.0, 29.0, 53.0, 78.0, 83.0, 98.0, 110.0, 82.0, 88.0, 73.0, 90.0, 40.0, 36.0, 22.0, 15.0, 13.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.387171745300293, -11.07668685913086, -10.766201972961426, -10.455717086791992, -10.145232200622559, -9.834747314453125, -9.524262428283691, -9.213777542114258, -8.903291702270508, -8.592806816101074, -8.28232192993164, -7.971837043762207, -7.661352157592773, -7.35086727142334, -7.040381908416748, -6.7298970222473145, -6.419412612915039, -6.1089277267456055, -5.798442840576172, -5.487957954406738, -5.177473068237305, -4.866988182067871, -4.556502819061279, -4.246017932891846, -3.935533046722412, -3.6250481605529785, -3.314563274383545, -3.0040781497955322, -2.6935932636260986, -2.383108377456665, -2.0726232528686523, -1.7621383666992188, -1.4516544342041016, -1.141169548034668, -0.8306845426559448, -0.5201995968818665, -0.20971465110778809, 0.10077023506164551, 0.41125524044036865, 0.7217402458190918, 1.0322251319885254, 1.342710018157959, 1.6531950235366821, 1.9636800289154053, 2.274164915084839, 2.5846498012542725, 2.895134925842285, 3.2056198120117188, 3.5161046981811523, 3.826589584350586, 4.1370744705200195, 4.447559356689453, 4.758044242858887, 5.06852912902832, 5.379014492034912, 5.689499378204346, 5.999984264373779, 6.310469150543213, 6.6209540367126465, 6.93143892288208, 7.241924285888672, 7.5524091720581055, 7.862894058227539, 8.173378944396973, 8.483863830566406]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 12.0, 13.0, 22.0, 48.0, 132.0, 282.0, 1213.0, 10947.0, 625040.0, 401102.0, 8301.0, 939.0, 296.0, 105.0, 44.0, 26.0, 11.0, 9.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3515625, -14.0250244140625, -13.698486328125, -13.3719482421875, -13.04541015625, -12.7188720703125, -12.392333984375, -12.0657958984375, -11.7392578125, -11.4127197265625, -11.086181640625, -10.7596435546875, -10.43310546875, -10.1065673828125, -9.780029296875, -9.4534912109375, -9.126953125, -8.8004150390625, -8.473876953125, -8.1473388671875, -7.82080078125, -7.4942626953125, -7.167724609375, -6.8411865234375, -6.5146484375, -6.1881103515625, -5.861572265625, -5.5350341796875, -5.20849609375, -4.8819580078125, -4.555419921875, -4.2288818359375, -3.90234375, -3.5758056640625, -3.249267578125, -2.9227294921875, -2.59619140625, -2.2696533203125, -1.943115234375, -1.6165771484375, -1.2900390625, -0.9635009765625, -0.636962890625, -0.3104248046875, 0.01611328125, 0.3426513671875, 0.669189453125, 0.9957275390625, 1.322265625, 1.6488037109375, 1.975341796875, 2.3018798828125, 2.62841796875, 2.9549560546875, 3.281494140625, 3.6080322265625, 3.9345703125, 4.2611083984375, 4.587646484375, 4.9141845703125, 5.24072265625, 5.5672607421875, 5.893798828125, 6.2203369140625, 6.546875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 13.0, 16.0, 14.0, 40.0, 46.0, 63.0, 60.0, 78.0, 78.0, 89.0, 111.0, 73.0, 80.0, 66.0, 61.0, 32.0, 33.0, 17.0, 10.0, 6.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.07421875, -2.02777099609375, -1.9813232421875, -1.93487548828125, -1.888427734375, -1.84197998046875, -1.7955322265625, -1.74908447265625, -1.70263671875, -1.65618896484375, -1.6097412109375, -1.56329345703125, -1.516845703125, -1.47039794921875, -1.4239501953125, -1.37750244140625, -1.3310546875, -1.28460693359375, -1.2381591796875, -1.19171142578125, -1.145263671875, -1.09881591796875, -1.0523681640625, -1.00592041015625, -0.95947265625, -0.91302490234375, -0.8665771484375, -0.82012939453125, -0.773681640625, -0.72723388671875, -0.6807861328125, -0.63433837890625, -0.587890625, -0.54144287109375, -0.4949951171875, -0.44854736328125, -0.402099609375, -0.35565185546875, -0.3092041015625, -0.26275634765625, -0.21630859375, -0.16986083984375, -0.1234130859375, -0.07696533203125, -0.030517578125, 0.01593017578125, 0.0623779296875, 0.10882568359375, 0.1552734375, 0.20172119140625, 0.2481689453125, 0.29461669921875, 0.341064453125, 0.38751220703125, 0.4339599609375, 0.48040771484375, 0.52685546875, 0.57330322265625, 0.6197509765625, 0.66619873046875, 0.712646484375, 0.75909423828125, 0.8055419921875, 0.85198974609375, 0.8984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 12.0, 9.0, 15.0, 17.0, 27.0, 36.0, 44.0, 78.0, 99.0, 132.0, 292.0, 559.0, 1538.0, 6038.0, 29710.0, 179908.0, 651940.0, 145598.0, 24655.0, 5150.0, 1363.0, 528.0, 254.0, 172.0, 90.0, 63.0, 48.0, 41.0, 39.0, 26.0, 18.0, 10.0, 11.0, 5.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0], "bins": [-4.46484375, -4.351654052734375, -4.23846435546875, -4.125274658203125, -4.0120849609375, -3.898895263671875, -3.78570556640625, -3.672515869140625, -3.559326171875, -3.446136474609375, -3.33294677734375, -3.219757080078125, -3.1065673828125, -2.993377685546875, -2.88018798828125, -2.766998291015625, -2.65380859375, -2.540618896484375, -2.42742919921875, -2.314239501953125, -2.2010498046875, -2.087860107421875, -1.97467041015625, -1.861480712890625, -1.748291015625, -1.635101318359375, -1.52191162109375, -1.408721923828125, -1.2955322265625, -1.182342529296875, -1.06915283203125, -0.955963134765625, -0.8427734375, -0.729583740234375, -0.61639404296875, -0.503204345703125, -0.3900146484375, -0.276824951171875, -0.16363525390625, -0.050445556640625, 0.062744140625, 0.175933837890625, 0.28912353515625, 0.402313232421875, 0.5155029296875, 0.628692626953125, 0.74188232421875, 0.855072021484375, 0.96826171875, 1.081451416015625, 1.19464111328125, 1.307830810546875, 1.4210205078125, 1.534210205078125, 1.64739990234375, 1.760589599609375, 1.873779296875, 1.986968994140625, 2.10015869140625, 2.213348388671875, 2.3265380859375, 2.439727783203125, 2.55291748046875, 2.666107177734375, 2.779296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 8.0, 11.0, 15.0, 15.0, 14.0, 17.0, 20.0, 20.0, 26.0, 29.0, 33.0, 34.0, 35.0, 41.0, 44.0, 46.0, 44.0, 46.0, 54.0, 41.0, 34.0, 38.0, 35.0, 43.0, 44.0, 33.0, 27.0, 22.0, 23.0, 11.0, 22.0, 15.0, 9.0, 11.0, 7.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.259765625, -3.166748046875, -3.07373046875, -2.980712890625, -2.8876953125, -2.794677734375, -2.70166015625, -2.608642578125, -2.515625, -2.422607421875, -2.32958984375, -2.236572265625, -2.1435546875, -2.050537109375, -1.95751953125, -1.864501953125, -1.771484375, -1.678466796875, -1.58544921875, -1.492431640625, -1.3994140625, -1.306396484375, -1.21337890625, -1.120361328125, -1.02734375, -0.934326171875, -0.84130859375, -0.748291015625, -0.6552734375, -0.562255859375, -0.46923828125, -0.376220703125, -0.283203125, -0.190185546875, -0.09716796875, -0.004150390625, 0.0888671875, 0.181884765625, 0.27490234375, 0.367919921875, 0.4609375, 0.553955078125, 0.64697265625, 0.739990234375, 0.8330078125, 0.926025390625, 1.01904296875, 1.112060546875, 1.205078125, 1.298095703125, 1.39111328125, 1.484130859375, 1.5771484375, 1.670166015625, 1.76318359375, 1.856201171875, 1.94921875, 2.042236328125, 2.13525390625, 2.228271484375, 2.3212890625, 2.414306640625, 2.50732421875, 2.600341796875, 2.693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 10.0, 7.0, 18.0, 23.0, 43.0, 66.0, 122.0, 177.0, 375.0, 810.0, 2081.0, 6570.0, 27282.0, 144842.0, 648490.0, 174832.0, 31316.0, 7423.0, 2271.0, 833.0, 400.0, 216.0, 120.0, 63.0, 40.0, 29.0, 22.0, 18.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.03125, -0.9995651245117188, -0.9678802490234375, -0.9361953735351562, -0.904510498046875, -0.8728256225585938, -0.8411407470703125, -0.8094558715820312, -0.77777099609375, -0.7460861206054688, -0.7144012451171875, -0.6827163696289062, -0.651031494140625, -0.6193466186523438, -0.5876617431640625, -0.5559768676757812, -0.5242919921875, -0.49260711669921875, -0.4609222412109375, -0.42923736572265625, -0.397552490234375, -0.36586761474609375, -0.3341827392578125, -0.30249786376953125, -0.27081298828125, -0.23912811279296875, -0.2074432373046875, -0.17575836181640625, -0.144073486328125, -0.11238861083984375, -0.0807037353515625, -0.04901885986328125, -0.017333984375, 0.01435089111328125, 0.0460357666015625, 0.07772064208984375, 0.109405517578125, 0.14109039306640625, 0.1727752685546875, 0.20446014404296875, 0.23614501953125, 0.26782989501953125, 0.2995147705078125, 0.33119964599609375, 0.362884521484375, 0.39456939697265625, 0.4262542724609375, 0.45793914794921875, 0.4896240234375, 0.5213088989257812, 0.5529937744140625, 0.5846786499023438, 0.616363525390625, 0.6480484008789062, 0.6797332763671875, 0.7114181518554688, 0.74310302734375, 0.7747879028320312, 0.8064727783203125, 0.8381576538085938, 0.869842529296875, 0.9015274047851562, 0.9332122802734375, 0.9648971557617188, 0.99658203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 11.0, 9.0, 15.0, 45.0, 55.0, 81.0, 194.0, 193.0, 166.0, 77.0, 53.0, 22.0, 21.0, 8.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000438690185546875, -0.00042694807052612305, -0.0004152059555053711, -0.00040346384048461914, -0.0003917217254638672, -0.00037997961044311523, -0.0003682374954223633, -0.00035649538040161133, -0.0003447532653808594, -0.0003330111503601074, -0.00032126903533935547, -0.0003095269203186035, -0.00029778480529785156, -0.0002860426902770996, -0.00027430057525634766, -0.0002625584602355957, -0.00025081634521484375, -0.0002390742301940918, -0.00022733211517333984, -0.0002155900001525879, -0.00020384788513183594, -0.00019210577011108398, -0.00018036365509033203, -0.00016862154006958008, -0.00015687942504882812, -0.00014513731002807617, -0.00013339519500732422, -0.00012165307998657227, -0.00010991096496582031, -9.816884994506836e-05, -8.64267349243164e-05, -7.468461990356445e-05, -6.29425048828125e-05, -5.120038986206055e-05, -3.9458274841308594e-05, -2.771615982055664e-05, -1.5974044799804688e-05, -4.231929779052734e-06, 7.510185241699219e-06, 1.9252300262451172e-05, 3.0994415283203125e-05, 4.273653030395508e-05, 5.447864532470703e-05, 6.622076034545898e-05, 7.796287536621094e-05, 8.970499038696289e-05, 0.00010144710540771484, 0.0001131892204284668, 0.00012493133544921875, 0.0001366734504699707, 0.00014841556549072266, 0.0001601576805114746, 0.00017189979553222656, 0.00018364191055297852, 0.00019538402557373047, 0.00020712614059448242, 0.00021886825561523438, 0.00023061037063598633, 0.00024235248565673828, 0.00025409460067749023, 0.0002658367156982422, 0.00027757883071899414, 0.0002893209457397461, 0.00030106306076049805, 0.00031280517578125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 9.0, 9.0, 11.0, 24.0, 26.0, 40.0, 92.0, 132.0, 227.0, 489.0, 1126.0, 3228.0, 14842.0, 108146.0, 701571.0, 187910.0, 23533.0, 4546.0, 1362.0, 562.0, 277.0, 138.0, 80.0, 52.0, 34.0, 32.0, 11.0, 11.0, 5.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8816757202148438, -0.8458709716796875, -0.8100662231445312, -0.774261474609375, -0.7384567260742188, -0.7026519775390625, -0.6668472290039062, -0.63104248046875, -0.5952377319335938, -0.5594329833984375, -0.5236282348632812, -0.487823486328125, -0.45201873779296875, -0.4162139892578125, -0.38040924072265625, -0.3446044921875, -0.30879974365234375, -0.2729949951171875, -0.23719024658203125, -0.201385498046875, -0.16558074951171875, -0.1297760009765625, -0.09397125244140625, -0.05816650390625, -0.02236175537109375, 0.0134429931640625, 0.04924774169921875, 0.085052490234375, 0.12085723876953125, 0.1566619873046875, 0.19246673583984375, 0.228271484375, 0.26407623291015625, 0.2998809814453125, 0.33568572998046875, 0.371490478515625, 0.40729522705078125, 0.4430999755859375, 0.47890472412109375, 0.51470947265625, 0.5505142211914062, 0.5863189697265625, 0.6221237182617188, 0.657928466796875, 0.6937332153320312, 0.7295379638671875, 0.7653427124023438, 0.8011474609375, 0.8369522094726562, 0.8727569580078125, 0.9085617065429688, 0.944366455078125, 0.9801712036132812, 1.0159759521484375, 1.0517807006835938, 1.08758544921875, 1.1233901977539062, 1.1591949462890625, 1.1949996948242188, 1.230804443359375, 1.2666091918945312, 1.3024139404296875, 1.3382186889648438, 1.3740234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 12.0, 9.0, 20.0, 27.0, 44.0, 57.0, 63.0, 121.0, 145.0, 139.0, 82.0, 78.0, 57.0, 44.0, 30.0, 13.0, 20.0, 12.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76953125, -0.7410125732421875, -0.712493896484375, -0.6839752197265625, -0.65545654296875, -0.6269378662109375, -0.598419189453125, -0.5699005126953125, -0.5413818359375, -0.5128631591796875, -0.484344482421875, -0.4558258056640625, -0.42730712890625, -0.3987884521484375, -0.370269775390625, -0.3417510986328125, -0.313232421875, -0.2847137451171875, -0.256195068359375, -0.2276763916015625, -0.19915771484375, -0.1706390380859375, -0.142120361328125, -0.1136016845703125, -0.0850830078125, -0.0565643310546875, -0.028045654296875, 0.0004730224609375, 0.02899169921875, 0.0575103759765625, 0.086029052734375, 0.1145477294921875, 0.14306640625, 0.1715850830078125, 0.200103759765625, 0.2286224365234375, 0.25714111328125, 0.2856597900390625, 0.314178466796875, 0.3426971435546875, 0.3712158203125, 0.3997344970703125, 0.428253173828125, 0.4567718505859375, 0.48529052734375, 0.5138092041015625, 0.542327880859375, 0.5708465576171875, 0.599365234375, 0.6278839111328125, 0.656402587890625, 0.6849212646484375, 0.71343994140625, 0.7419586181640625, 0.770477294921875, 0.7989959716796875, 0.8275146484375, 0.8560333251953125, 0.884552001953125, 0.9130706787109375, 0.94158935546875, 0.9701080322265625, 0.998626708984375, 1.0271453857421875, 1.0556640625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 7.0, 10.0, 23.0, 86.0, 202.0, 283.0, 254.0, 81.0, 44.0, 15.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.402024269104004, -10.21059799194336, -9.019170761108398, -7.827744007110596, -6.636317253112793, -5.44489049911499, -4.2534637451171875, -3.062037467956543, -1.870610237121582, -0.6791834831237793, 0.5122432708740234, 1.7036700248718262, 2.895096778869629, 4.086523532867432, 5.277950286865234, 6.469376564025879, 7.66080379486084, 8.852230072021484, 10.043657302856445, 11.235084533691406, 12.42651081085205, 13.617937088012695, 14.809364318847656, 16.000789642333984, 17.192218780517578, 18.38364601135254, 19.5750732421875, 20.766498565673828, 21.95792579650879, 23.14935302734375, 24.340778350830078, 25.53220558166504, 26.7236328125, 27.91506004333496, 29.106487274169922, 30.29791259765625, 31.48933982849121, 32.68076705932617, 33.8721923828125, 35.063621520996094, 36.25504684448242, 37.44647216796875, 38.637901306152344, 39.82932662963867, 41.020751953125, 42.212181091308594, 43.40360641479492, 44.59503173828125, 45.786460876464844, 46.97788619995117, 48.169315338134766, 49.360740661621094, 50.55216979980469, 51.743595123291016, 52.935020446777344, 54.12644958496094, 55.317874908447266, 56.509300231933594, 57.70072937011719, 58.892154693603516, 60.083580017089844, 61.27500915527344, 62.466434478759766, 63.657859802246094, 64.84928894042969]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 6.0, 7.0, 24.0, 8.0, 20.0, 25.0, 25.0, 29.0, 46.0, 27.0, 51.0, 51.0, 46.0, 43.0, 62.0, 55.0, 51.0, 50.0, 47.0, 36.0, 30.0, 45.0, 27.0, 35.0, 29.0, 29.0, 24.0, 12.0, 12.0, 6.0, 8.0, 12.0, 3.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.992293357849121, -15.482062339782715, -14.971830368041992, -14.461599349975586, -13.951367378234863, -13.441136360168457, -12.930904388427734, -12.420673370361328, -11.910442352294922, -11.400211334228516, -10.889979362487793, -10.379748344421387, -9.869516372680664, -9.359285354614258, -8.849054336547852, -8.338822364807129, -7.828590393066406, -7.318358898162842, -6.808127403259277, -6.297896385192871, -5.787664413452148, -5.277433395385742, -4.767201900482178, -4.256970405578613, -3.746738910675049, -3.2365074157714844, -2.72627592086792, -2.2160446643829346, -1.7058131694793701, -1.1955816745758057, -0.6853504180908203, -0.17511892318725586, 0.3351116180419922, 0.8453430533409119, 1.3555744886398315, 1.8658058643341064, 2.376037359237671, 2.8862688541412354, 3.3965001106262207, 3.906731605529785, 4.41696310043335, 4.927194595336914, 5.4374260902404785, 5.947657585144043, 6.457888603210449, 6.968120574951172, 7.478351593017578, 7.988583087921143, 8.498814582824707, 9.009045600891113, 9.519277572631836, 10.029508590698242, 10.539740562438965, 11.049971580505371, 11.560203552246094, 12.0704345703125, 12.580665588378906, 13.090896606445312, 13.601128578186035, 14.111359596252441, 14.621591567993164, 15.13182258605957, 15.642053604125977, 16.152286529541016, 16.662517547607422]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 10.0, 15.0, 19.0, 23.0, 35.0, 46.0, 73.0, 123.0, 175.0, 297.0, 584.0, 1131.0, 2652.0, 7302.0, 30275.0, 510423.0, 3583442.0, 42442.0, 9484.0, 3093.0, 1295.0, 587.0, 319.0, 155.0, 91.0, 48.0, 40.0, 27.0, 21.0, 10.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.15313720703125, -7.9547119140625, -7.75628662109375, -7.557861328125, -7.35943603515625, -7.1610107421875, -6.96258544921875, -6.76416015625, -6.56573486328125, -6.3673095703125, -6.16888427734375, -5.970458984375, -5.77203369140625, -5.5736083984375, -5.37518310546875, -5.1767578125, -4.97833251953125, -4.7799072265625, -4.58148193359375, -4.383056640625, -4.18463134765625, -3.9862060546875, -3.78778076171875, -3.58935546875, -3.39093017578125, -3.1925048828125, -2.99407958984375, -2.795654296875, -2.59722900390625, -2.3988037109375, -2.20037841796875, -2.001953125, -1.80352783203125, -1.6051025390625, -1.40667724609375, -1.208251953125, -1.00982666015625, -0.8114013671875, -0.61297607421875, -0.41455078125, -0.21612548828125, -0.0177001953125, 0.18072509765625, 0.379150390625, 0.57757568359375, 0.7760009765625, 0.97442626953125, 1.1728515625, 1.37127685546875, 1.5697021484375, 1.76812744140625, 1.966552734375, 2.16497802734375, 2.3634033203125, 2.56182861328125, 2.76025390625, 2.95867919921875, 3.1571044921875, 3.35552978515625, 3.553955078125, 3.75238037109375, 3.9508056640625, 4.14923095703125, 4.34765625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 13.0, 11.0, 20.0, 22.0, 40.0, 45.0, 71.0, 61.0, 59.0, 74.0, 87.0, 86.0, 80.0, 61.0, 60.0, 58.0, 43.0, 37.0, 22.0, 13.0, 11.0, 9.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.873046875, -1.8291244506835938, -1.7852020263671875, -1.7412796020507812, -1.697357177734375, -1.6534347534179688, -1.6095123291015625, -1.5655899047851562, -1.52166748046875, -1.4777450561523438, -1.4338226318359375, -1.3899002075195312, -1.345977783203125, -1.3020553588867188, -1.2581329345703125, -1.2142105102539062, -1.1702880859375, -1.1263656616210938, -1.0824432373046875, -1.0385208129882812, -0.994598388671875, -0.9506759643554688, -0.9067535400390625, -0.8628311157226562, -0.81890869140625, -0.7749862670898438, -0.7310638427734375, -0.6871414184570312, -0.643218994140625, -0.5992965698242188, -0.5553741455078125, -0.5114517211914062, -0.467529296875, -0.42360687255859375, -0.3796844482421875, -0.33576202392578125, -0.291839599609375, -0.24791717529296875, -0.2039947509765625, -0.16007232666015625, -0.11614990234375, -0.07222747802734375, -0.0283050537109375, 0.01561737060546875, 0.059539794921875, 0.10346221923828125, 0.1473846435546875, 0.19130706787109375, 0.2352294921875, 0.27915191650390625, 0.3230743408203125, 0.36699676513671875, 0.410919189453125, 0.45484161376953125, 0.4987640380859375, 0.5426864624023438, 0.58660888671875, 0.6305313110351562, 0.6744537353515625, 0.7183761596679688, 0.762298583984375, 0.8062210083007812, 0.8501434326171875, 0.8940658569335938, 0.93798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 13.0, 20.0, 29.0, 39.0, 73.0, 119.0, 193.0, 325.0, 650.0, 1493.0, 4748.0, 29092.0, 3659930.0, 472522.0, 18510.0, 3852.0, 1279.0, 611.0, 306.0, 154.0, 124.0, 61.0, 37.0, 23.0, 13.0, 16.0, 7.0, 5.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.453125, -9.2100830078125, -8.967041015625, -8.7239990234375, -8.48095703125, -8.2379150390625, -7.994873046875, -7.7518310546875, -7.5087890625, -7.2657470703125, -7.022705078125, -6.7796630859375, -6.53662109375, -6.2935791015625, -6.050537109375, -5.8074951171875, -5.564453125, -5.3214111328125, -5.078369140625, -4.8353271484375, -4.59228515625, -4.3492431640625, -4.106201171875, -3.8631591796875, -3.6201171875, -3.3770751953125, -3.134033203125, -2.8909912109375, -2.64794921875, -2.4049072265625, -2.161865234375, -1.9188232421875, -1.67578125, -1.4327392578125, -1.189697265625, -0.9466552734375, -0.70361328125, -0.4605712890625, -0.217529296875, 0.0255126953125, 0.2685546875, 0.5115966796875, 0.754638671875, 0.9976806640625, 1.24072265625, 1.4837646484375, 1.726806640625, 1.9698486328125, 2.212890625, 2.4559326171875, 2.698974609375, 2.9420166015625, 3.18505859375, 3.4281005859375, 3.671142578125, 3.9141845703125, 4.1572265625, 4.4002685546875, 4.643310546875, 4.8863525390625, 5.12939453125, 5.3724365234375, 5.615478515625, 5.8585205078125, 6.1015625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 9.0, 21.0, 55.0, 109.0, 630.0, 2856.0, 207.0, 83.0, 32.0, 26.0, 14.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.046875, -3.943695068359375, -3.84051513671875, -3.737335205078125, -3.6341552734375, -3.530975341796875, -3.42779541015625, -3.324615478515625, -3.221435546875, -3.118255615234375, -3.01507568359375, -2.911895751953125, -2.8087158203125, -2.705535888671875, -2.60235595703125, -2.499176025390625, -2.39599609375, -2.292816162109375, -2.18963623046875, -2.086456298828125, -1.9832763671875, -1.880096435546875, -1.77691650390625, -1.673736572265625, -1.570556640625, -1.467376708984375, -1.36419677734375, -1.261016845703125, -1.1578369140625, -1.054656982421875, -0.95147705078125, -0.848297119140625, -0.7451171875, -0.641937255859375, -0.53875732421875, -0.435577392578125, -0.3323974609375, -0.229217529296875, -0.12603759765625, -0.022857666015625, 0.080322265625, 0.183502197265625, 0.28668212890625, 0.389862060546875, 0.4930419921875, 0.596221923828125, 0.69940185546875, 0.802581787109375, 0.90576171875, 1.008941650390625, 1.11212158203125, 1.215301513671875, 1.3184814453125, 1.421661376953125, 1.52484130859375, 1.628021240234375, 1.731201171875, 1.834381103515625, 1.93756103515625, 2.040740966796875, 2.1439208984375, 2.247100830078125, 2.35028076171875, 2.453460693359375, 2.556640625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 9.0, 66.0, 717.0, 188.0, 25.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.32317352294922, -15.828619956970215, -14.334067344665527, -12.839513778686523, -11.344961166381836, -9.850407600402832, -8.355854034423828, -6.861301422119141, -5.366747856140137, -3.872194766998291, -2.377641439437866, -0.8830881118774414, 0.6114649772644043, 2.10601806640625, 3.600571632385254, 5.095124244689941, 6.589677810668945, 8.08423137664795, 9.578783988952637, 11.07333755493164, 12.567890167236328, 14.062443733215332, 15.556997299194336, 17.051549911499023, 18.546104431152344, 20.04065704345703, 21.53521156311035, 23.02976417541504, 24.524316787719727, 26.018871307373047, 27.513423919677734, 29.007976531982422, 30.50252914428711, 31.997081756591797, 33.491634368896484, 34.98619079589844, 36.480743408203125, 37.97529602050781, 39.4698486328125, 40.96440124511719, 42.458953857421875, 43.95350646972656, 45.44805908203125, 46.94261169433594, 48.43716812133789, 49.93172073364258, 51.426273345947266, 52.92082595825195, 54.415382385253906, 55.909934997558594, 57.40448760986328, 58.89904022216797, 60.39359664916992, 61.88814926147461, 63.3827018737793, 64.87725830078125, 66.3718032836914, 67.8663558959961, 69.36090850830078, 70.85546112060547, 72.35001373291016, 73.84456634521484, 75.33912658691406, 76.83367919921875, 78.32823181152344]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 2.0, 5.0, 14.0, 20.0, 23.0, 26.0, 46.0, 48.0, 62.0, 55.0, 66.0, 89.0, 67.0, 67.0, 73.0, 69.0, 57.0, 49.0, 54.0, 25.0, 25.0, 13.0, 19.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.762116432189941, -7.51392126083374, -7.265726089477539, -7.01753044128418, -6.7693352699279785, -6.521140098571777, -6.272944927215576, -6.024749755859375, -5.776554107666016, -5.5283589363098145, -5.280163764953613, -5.031968116760254, -4.783772945404053, -4.535577774047852, -4.28738260269165, -4.039187431335449, -3.790992021560669, -3.5427968502044678, -3.2946014404296875, -3.0464062690734863, -2.798210859298706, -2.550015687942505, -2.3018202781677246, -2.0536251068115234, -1.8054298162460327, -1.557234525680542, -1.3090392351150513, -1.0608439445495605, -0.8126487135887146, -0.5644534826278687, -0.31625819206237793, -0.06806290149688721, 0.18013238906860352, 0.42832767963409424, 0.676522970199585, 0.9247182011604309, 1.1729135513305664, 1.4211087226867676, 1.6693040132522583, 1.917499303817749, 2.1656947135925293, 2.4138898849487305, 2.6620852947235107, 2.910280466079712, 3.158475875854492, 3.4066710472106934, 3.6548662185668945, 3.903061628341675, 4.151256561279297, 4.399451732635498, 4.647646903991699, 4.895842552185059, 5.14403772354126, 5.392232894897461, 5.640428066253662, 5.888623237609863, 6.136818885803223, 6.385014057159424, 6.633209228515625, 6.881404876708984, 7.1296000480651855, 7.377795219421387, 7.625990390777588, 7.874185562133789, 8.122381210327148]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 22.0, 23.0, 30.0, 36.0, 116.0, 198.0, 382.0, 808.0, 2350.0, 10356.0, 73634.0, 592878.0, 323461.0, 35370.0, 6009.0, 1616.0, 612.0, 279.0, 153.0, 73.0, 50.0, 34.0, 15.0, 11.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.70501708984375, -4.5155029296875, -4.32598876953125, -4.136474609375, -3.94696044921875, -3.7574462890625, -3.56793212890625, -3.37841796875, -3.18890380859375, -2.9993896484375, -2.80987548828125, -2.620361328125, -2.43084716796875, -2.2413330078125, -2.05181884765625, -1.8623046875, -1.67279052734375, -1.4832763671875, -1.29376220703125, -1.104248046875, -0.91473388671875, -0.7252197265625, -0.53570556640625, -0.34619140625, -0.15667724609375, 0.0328369140625, 0.22235107421875, 0.411865234375, 0.60137939453125, 0.7908935546875, 0.98040771484375, 1.169921875, 1.35943603515625, 1.5489501953125, 1.73846435546875, 1.927978515625, 2.11749267578125, 2.3070068359375, 2.49652099609375, 2.68603515625, 2.87554931640625, 3.0650634765625, 3.25457763671875, 3.444091796875, 3.63360595703125, 3.8231201171875, 4.01263427734375, 4.2021484375, 4.39166259765625, 4.5811767578125, 4.77069091796875, 4.960205078125, 5.14971923828125, 5.3392333984375, 5.52874755859375, 5.71826171875, 5.90777587890625, 6.0972900390625, 6.28680419921875, 6.476318359375, 6.66583251953125, 6.8553466796875, 7.04486083984375, 7.234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 10.0, 16.0, 19.0, 20.0, 28.0, 36.0, 49.0, 70.0, 82.0, 76.0, 86.0, 65.0, 89.0, 86.0, 63.0, 50.0, 43.0, 37.0, 21.0, 16.0, 11.0, 10.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9326171875, -1.88653564453125, -1.8404541015625, -1.79437255859375, -1.748291015625, -1.70220947265625, -1.6561279296875, -1.61004638671875, -1.56396484375, -1.51788330078125, -1.4718017578125, -1.42572021484375, -1.379638671875, -1.33355712890625, -1.2874755859375, -1.24139404296875, -1.1953125, -1.14923095703125, -1.1031494140625, -1.05706787109375, -1.010986328125, -0.96490478515625, -0.9188232421875, -0.87274169921875, -0.82666015625, -0.78057861328125, -0.7344970703125, -0.68841552734375, -0.642333984375, -0.59625244140625, -0.5501708984375, -0.50408935546875, -0.4580078125, -0.41192626953125, -0.3658447265625, -0.31976318359375, -0.273681640625, -0.22760009765625, -0.1815185546875, -0.13543701171875, -0.08935546875, -0.04327392578125, 0.0028076171875, 0.04888916015625, 0.094970703125, 0.14105224609375, 0.1871337890625, 0.23321533203125, 0.279296875, 0.32537841796875, 0.3714599609375, 0.41754150390625, 0.463623046875, 0.50970458984375, 0.5557861328125, 0.60186767578125, 0.64794921875, 0.69403076171875, 0.7401123046875, 0.78619384765625, 0.832275390625, 0.87835693359375, 0.9244384765625, 0.97052001953125, 1.0166015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 4.0, 9.0, 10.0, 12.0, 19.0, 38.0, 66.0, 104.0, 193.0, 440.0, 974.0, 2976.0, 12632.0, 82757.0, 544433.0, 346704.0, 45649.0, 7832.0, 2081.0, 746.0, 376.0, 218.0, 108.0, 57.0, 36.0, 23.0, 16.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.3857421875, -4.248046875, -4.1103515625, -3.97265625, -3.8349609375, -3.697265625, -3.5595703125, -3.421875, -3.2841796875, -3.146484375, -3.0087890625, -2.87109375, -2.7333984375, -2.595703125, -2.4580078125, -2.3203125, -2.1826171875, -2.044921875, -1.9072265625, -1.76953125, -1.6318359375, -1.494140625, -1.3564453125, -1.21875, -1.0810546875, -0.943359375, -0.8056640625, -0.66796875, -0.5302734375, -0.392578125, -0.2548828125, -0.1171875, 0.0205078125, 0.158203125, 0.2958984375, 0.43359375, 0.5712890625, 0.708984375, 0.8466796875, 0.984375, 1.1220703125, 1.259765625, 1.3974609375, 1.53515625, 1.6728515625, 1.810546875, 1.9482421875, 2.0859375, 2.2236328125, 2.361328125, 2.4990234375, 2.63671875, 2.7744140625, 2.912109375, 3.0498046875, 3.1875, 3.3251953125, 3.462890625, 3.6005859375, 3.73828125, 3.8759765625, 4.013671875, 4.1513671875, 4.2890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 8.0, 7.0, 8.0, 14.0, 14.0, 28.0, 30.0, 32.0, 33.0, 49.0, 49.0, 64.0, 47.0, 60.0, 72.0, 70.0, 66.0, 57.0, 53.0, 38.0, 41.0, 38.0, 33.0, 21.0, 19.0, 12.0, 8.0, 9.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.265625, -4.0994873046875, -3.933349609375, -3.7672119140625, -3.60107421875, -3.4349365234375, -3.268798828125, -3.1026611328125, -2.9365234375, -2.7703857421875, -2.604248046875, -2.4381103515625, -2.27197265625, -2.1058349609375, -1.939697265625, -1.7735595703125, -1.607421875, -1.4412841796875, -1.275146484375, -1.1090087890625, -0.94287109375, -0.7767333984375, -0.610595703125, -0.4444580078125, -0.2783203125, -0.1121826171875, 0.053955078125, 0.2200927734375, 0.38623046875, 0.5523681640625, 0.718505859375, 0.8846435546875, 1.05078125, 1.2169189453125, 1.383056640625, 1.5491943359375, 1.71533203125, 1.8814697265625, 2.047607421875, 2.2137451171875, 2.3798828125, 2.5460205078125, 2.712158203125, 2.8782958984375, 3.04443359375, 3.2105712890625, 3.376708984375, 3.5428466796875, 3.708984375, 3.8751220703125, 4.041259765625, 4.2073974609375, 4.37353515625, 4.5396728515625, 4.705810546875, 4.8719482421875, 5.0380859375, 5.2042236328125, 5.370361328125, 5.5364990234375, 5.70263671875, 5.8687744140625, 6.034912109375, 6.2010498046875, 6.3671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 24.0, 60.0, 140.0, 392.0, 1184.0, 8490.0, 544926.0, 483666.0, 7849.0, 1195.0, 335.0, 166.0, 59.0, 23.0, 9.0, 10.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.350555419921875, -3.21087646484375, -3.071197509765625, -2.9315185546875, -2.791839599609375, -2.65216064453125, -2.512481689453125, -2.372802734375, -2.233123779296875, -2.09344482421875, -1.953765869140625, -1.8140869140625, -1.674407958984375, -1.53472900390625, -1.395050048828125, -1.25537109375, -1.115692138671875, -0.97601318359375, -0.836334228515625, -0.6966552734375, -0.556976318359375, -0.41729736328125, -0.277618408203125, -0.137939453125, 0.001739501953125, 0.14141845703125, 0.281097412109375, 0.4207763671875, 0.560455322265625, 0.70013427734375, 0.839813232421875, 0.9794921875, 1.119171142578125, 1.25885009765625, 1.398529052734375, 1.5382080078125, 1.677886962890625, 1.81756591796875, 1.957244873046875, 2.096923828125, 2.236602783203125, 2.37628173828125, 2.515960693359375, 2.6556396484375, 2.795318603515625, 2.93499755859375, 3.074676513671875, 3.21435546875, 3.354034423828125, 3.49371337890625, 3.633392333984375, 3.7730712890625, 3.912750244140625, 4.05242919921875, 4.192108154296875, 4.331787109375, 4.471466064453125, 4.61114501953125, 4.750823974609375, 4.8905029296875, 5.030181884765625, 5.16986083984375, 5.309539794921875, 5.44921875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 16.0, 22.0, 29.0, 46.0, 57.0, 96.0, 107.0, 134.0, 122.0, 86.0, 56.0, 55.0, 31.0, 33.0, 26.0, 12.0, 10.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025534629821777344, -0.00024670735001564026, -0.00023806840181350708, -0.0002294294536113739, -0.00022079050540924072, -0.00021215155720710754, -0.00020351260900497437, -0.0001948736608028412, -0.000186234712600708, -0.00017759576439857483, -0.00016895681619644165, -0.00016031786799430847, -0.0001516789197921753, -0.00014303997159004211, -0.00013440102338790894, -0.00012576207518577576, -0.00011712312698364258, -0.0001084841787815094, -9.984523057937622e-05, -9.120628237724304e-05, -8.256733417510986e-05, -7.392838597297668e-05, -6.52894377708435e-05, -5.665048956871033e-05, -4.801154136657715e-05, -3.937259316444397e-05, -3.073364496231079e-05, -2.2094696760177612e-05, -1.3455748558044434e-05, -4.816800355911255e-06, 3.822147846221924e-06, 1.2461096048355103e-05, 2.110004425048828e-05, 2.973899245262146e-05, 3.837794065475464e-05, 4.701688885688782e-05, 5.5655837059020996e-05, 6.429478526115417e-05, 7.293373346328735e-05, 8.157268166542053e-05, 9.021162986755371e-05, 9.885057806968689e-05, 0.00010748952627182007, 0.00011612847447395325, 0.00012476742267608643, 0.0001334063708782196, 0.00014204531908035278, 0.00015068426728248596, 0.00015932321548461914, 0.00016796216368675232, 0.0001766011118888855, 0.00018524006009101868, 0.00019387900829315186, 0.00020251795649528503, 0.0002111569046974182, 0.0002197958528995514, 0.00022843480110168457, 0.00023707374930381775, 0.00024571269750595093, 0.0002543516457080841, 0.0002629905939102173, 0.00027162954211235046, 0.00028026849031448364, 0.0002889074385166168, 0.00029754638671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 11.0, 20.0, 18.0, 39.0, 57.0, 76.0, 146.0, 300.0, 755.0, 3476.0, 42081.0, 848365.0, 143814.0, 7275.0, 1237.0, 384.0, 200.0, 115.0, 70.0, 44.0, 26.0, 15.0, 17.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.884765625, -3.7694091796875, -3.654052734375, -3.5386962890625, -3.42333984375, -3.3079833984375, -3.192626953125, -3.0772705078125, -2.9619140625, -2.8465576171875, -2.731201171875, -2.6158447265625, -2.50048828125, -2.3851318359375, -2.269775390625, -2.1544189453125, -2.0390625, -1.9237060546875, -1.808349609375, -1.6929931640625, -1.57763671875, -1.4622802734375, -1.346923828125, -1.2315673828125, -1.1162109375, -1.0008544921875, -0.885498046875, -0.7701416015625, -0.65478515625, -0.5394287109375, -0.424072265625, -0.3087158203125, -0.193359375, -0.0780029296875, 0.037353515625, 0.1527099609375, 0.26806640625, 0.3834228515625, 0.498779296875, 0.6141357421875, 0.7294921875, 0.8448486328125, 0.960205078125, 1.0755615234375, 1.19091796875, 1.3062744140625, 1.421630859375, 1.5369873046875, 1.65234375, 1.7677001953125, 1.883056640625, 1.9984130859375, 2.11376953125, 2.2291259765625, 2.344482421875, 2.4598388671875, 2.5751953125, 2.6905517578125, 2.805908203125, 2.9212646484375, 3.03662109375, 3.1519775390625, 3.267333984375, 3.3826904296875, 3.498046875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 5.0, 3.0, 17.0, 16.0, 24.0, 37.0, 78.0, 97.0, 168.0, 151.0, 143.0, 87.0, 61.0, 35.0, 36.0, 16.0, 11.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.0433502197265625, -0.950958251953125, -0.8585662841796875, -0.76617431640625, -0.6737823486328125, -0.581390380859375, -0.4889984130859375, -0.3966064453125, -0.3042144775390625, -0.211822509765625, -0.1194305419921875, -0.02703857421875, 0.0653533935546875, 0.157745361328125, 0.2501373291015625, 0.342529296875, 0.4349212646484375, 0.527313232421875, 0.6197052001953125, 0.71209716796875, 0.8044891357421875, 0.896881103515625, 0.9892730712890625, 1.0816650390625, 1.1740570068359375, 1.266448974609375, 1.3588409423828125, 1.45123291015625, 1.5436248779296875, 1.636016845703125, 1.7284088134765625, 1.82080078125, 1.9131927490234375, 2.005584716796875, 2.0979766845703125, 2.19036865234375, 2.2827606201171875, 2.375152587890625, 2.4675445556640625, 2.5599365234375, 2.6523284912109375, 2.744720458984375, 2.8371124267578125, 2.92950439453125, 3.0218963623046875, 3.114288330078125, 3.2066802978515625, 3.299072265625, 3.3914642333984375, 3.483856201171875, 3.5762481689453125, 3.66864013671875, 3.7610321044921875, 3.853424072265625, 3.9458160400390625, 4.0382080078125, 4.1305999755859375, 4.222991943359375, 4.3153839111328125, 4.40777587890625, 4.5001678466796875, 4.592559814453125, 4.6849517822265625, 4.77734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 58.0, 173.0, 380.0, 281.0, 86.0, 16.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.46617126464844, -31.035585403442383, -28.604999542236328, -26.17441177368164, -23.743825912475586, -21.31324005126953, -18.882652282714844, -16.45206642150879, -14.021480560302734, -11.59089469909668, -9.160307884216309, -6.729721546173096, -4.299135208129883, -1.8685493469238281, 0.562037467956543, 2.992624282836914, 5.423210144042969, 7.853796482086182, 10.284382820129395, 12.714969635009766, 15.14555549621582, 17.576141357421875, 20.006729125976562, 22.437314987182617, 24.867900848388672, 27.298486709594727, 29.72907257080078, 32.15966033935547, 34.590248107910156, 37.02083206176758, 39.451419830322266, 41.88200378417969, 44.312591552734375, 46.74317932128906, 49.173763275146484, 51.60435104370117, 54.034934997558594, 56.46552276611328, 58.89611053466797, 61.326698303222656, 63.75728225708008, 66.1878662109375, 68.61845397949219, 71.04904174804688, 73.47962951660156, 75.91021728515625, 78.3407974243164, 80.7713851928711, 83.20197296142578, 85.63256072998047, 88.06314849853516, 90.49372863769531, 92.92431640625, 95.35490417480469, 97.78549194335938, 100.21607971191406, 102.64666748046875, 105.07725524902344, 107.50784301757812, 109.93842315673828, 112.36901092529297, 114.79959869384766, 117.23018646240234, 119.66077423095703, 122.09135437011719]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 6.0, 12.0, 15.0, 11.0, 13.0, 18.0, 20.0, 18.0, 28.0, 19.0, 28.0, 27.0, 25.0, 34.0, 29.0, 34.0, 43.0, 43.0, 28.0, 44.0, 46.0, 32.0, 49.0, 44.0, 34.0, 35.0, 29.0, 26.0, 19.0, 23.0, 15.0, 20.0, 13.0, 10.0, 13.0, 10.0, 11.0, 10.0, 5.0, 6.0, 7.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-20.601903915405273, -19.95659828186035, -19.311290740966797, -18.665985107421875, -18.020679473876953, -17.3753719329834, -16.730066299438477, -16.084758758544922, -15.439453125, -14.794146537780762, -14.148839950561523, -13.503534317016602, -12.858227729797363, -12.212921142578125, -11.567615509033203, -10.922308921813965, -10.277002334594727, -9.631695747375488, -8.98638916015625, -8.341083526611328, -7.69577693939209, -7.050470352172852, -6.4051642417907715, -5.759858131408691, -5.114551544189453, -4.469244956970215, -3.8239388465881348, -3.1786324977874756, -2.5333261489868164, -1.8880198001861572, -1.242713451385498, -0.597407341003418, 0.0478973388671875, 0.6932036876678467, 1.3385100364685059, 1.983816385269165, 2.629122734069824, 3.2744290828704834, 3.9197354316711426, 4.565041542053223, 5.210348129272461, 5.855654716491699, 6.500960826873779, 7.146266937255859, 7.791573524475098, 8.436880111694336, 9.082185745239258, 9.727492332458496, 10.372798919677734, 11.018105506896973, 11.663412094116211, 12.308717727661133, 12.954024314880371, 13.59933090209961, 14.244636535644531, 14.88994312286377, 15.535249710083008, 16.18055534362793, 16.825862884521484, 17.471168518066406, 18.116474151611328, 18.761781692504883, 19.407087326049805, 20.05239486694336, 20.69770050048828]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 10.0, 11.0, 10.0, 15.0, 17.0, 27.0, 31.0, 43.0, 69.0, 78.0, 123.0, 210.0, 359.0, 669.0, 1446.0, 3103.0, 7406.0, 21046.0, 92568.0, 3570029.0, 426619.0, 46893.0, 13451.0, 5309.0, 2272.0, 1121.0, 548.0, 330.0, 151.0, 106.0, 61.0, 46.0, 23.0, 24.0, 12.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.734375, -5.569580078125, -5.40478515625, -5.239990234375, -5.0751953125, -4.910400390625, -4.74560546875, -4.580810546875, -4.416015625, -4.251220703125, -4.08642578125, -3.921630859375, -3.7568359375, -3.592041015625, -3.42724609375, -3.262451171875, -3.09765625, -2.932861328125, -2.76806640625, -2.603271484375, -2.4384765625, -2.273681640625, -2.10888671875, -1.944091796875, -1.779296875, -1.614501953125, -1.44970703125, -1.284912109375, -1.1201171875, -0.955322265625, -0.79052734375, -0.625732421875, -0.4609375, -0.296142578125, -0.13134765625, 0.033447265625, 0.1982421875, 0.363037109375, 0.52783203125, 0.692626953125, 0.857421875, 1.022216796875, 1.18701171875, 1.351806640625, 1.5166015625, 1.681396484375, 1.84619140625, 2.010986328125, 2.17578125, 2.340576171875, 2.50537109375, 2.670166015625, 2.8349609375, 2.999755859375, 3.16455078125, 3.329345703125, 3.494140625, 3.658935546875, 3.82373046875, 3.988525390625, 4.1533203125, 4.318115234375, 4.48291015625, 4.647705078125, 4.8125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 11.0, 7.0, 14.0, 17.0, 28.0, 28.0, 28.0, 40.0, 47.0, 50.0, 59.0, 74.0, 64.0, 58.0, 83.0, 69.0, 49.0, 66.0, 39.0, 41.0, 29.0, 20.0, 24.0, 7.0, 21.0, 8.0, 2.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8194732666015625, -1.770782470703125, -1.7220916748046875, -1.67340087890625, -1.6247100830078125, -1.576019287109375, -1.5273284912109375, -1.4786376953125, -1.4299468994140625, -1.381256103515625, -1.3325653076171875, -1.28387451171875, -1.2351837158203125, -1.186492919921875, -1.1378021240234375, -1.089111328125, -1.0404205322265625, -0.991729736328125, -0.9430389404296875, -0.89434814453125, -0.8456573486328125, -0.796966552734375, -0.7482757568359375, -0.6995849609375, -0.6508941650390625, -0.602203369140625, -0.5535125732421875, -0.50482177734375, -0.4561309814453125, -0.407440185546875, -0.3587493896484375, -0.31005859375, -0.2613677978515625, -0.212677001953125, -0.1639862060546875, -0.11529541015625, -0.0666046142578125, -0.017913818359375, 0.0307769775390625, 0.0794677734375, 0.1281585693359375, 0.176849365234375, 0.2255401611328125, 0.27423095703125, 0.3229217529296875, 0.371612548828125, 0.4203033447265625, 0.468994140625, 0.5176849365234375, 0.566375732421875, 0.6150665283203125, 0.66375732421875, 0.7124481201171875, 0.761138916015625, 0.8098297119140625, 0.8585205078125, 0.9072113037109375, 0.955902099609375, 1.0045928955078125, 1.05328369140625, 1.1019744873046875, 1.150665283203125, 1.1993560791015625, 1.248046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 6.0, 6.0, 13.0, 9.0, 28.0, 29.0, 45.0, 73.0, 112.0, 219.0, 399.0, 838.0, 1612.0, 3819.0, 9868.0, 30825.0, 147577.0, 3527160.0, 393714.0, 53047.0, 14817.0, 5495.0, 2304.0, 1066.0, 510.0, 297.0, 165.0, 75.0, 44.0, 27.0, 33.0, 18.0, 11.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9296875, -4.791595458984375, -4.65350341796875, -4.515411376953125, -4.3773193359375, -4.239227294921875, -4.10113525390625, -3.963043212890625, -3.824951171875, -3.686859130859375, -3.54876708984375, -3.410675048828125, -3.2725830078125, -3.134490966796875, -2.99639892578125, -2.858306884765625, -2.72021484375, -2.582122802734375, -2.44403076171875, -2.305938720703125, -2.1678466796875, -2.029754638671875, -1.89166259765625, -1.753570556640625, -1.615478515625, -1.477386474609375, -1.33929443359375, -1.201202392578125, -1.0631103515625, -0.925018310546875, -0.78692626953125, -0.648834228515625, -0.5107421875, -0.372650146484375, -0.23455810546875, -0.096466064453125, 0.0416259765625, 0.179718017578125, 0.31781005859375, 0.455902099609375, 0.593994140625, 0.732086181640625, 0.87017822265625, 1.008270263671875, 1.1463623046875, 1.284454345703125, 1.42254638671875, 1.560638427734375, 1.69873046875, 1.836822509765625, 1.97491455078125, 2.113006591796875, 2.2510986328125, 2.389190673828125, 2.52728271484375, 2.665374755859375, 2.803466796875, 2.941558837890625, 3.07965087890625, 3.217742919921875, 3.3558349609375, 3.493927001953125, 3.63201904296875, 3.770111083984375, 3.908203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 4.0, 9.0, 10.0, 9.0, 11.0, 15.0, 16.0, 25.0, 45.0, 39.0, 62.0, 139.0, 275.0, 1252.0, 1426.0, 298.0, 151.0, 73.0, 50.0, 32.0, 29.0, 24.0, 19.0, 7.0, 12.0, 6.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.630859375, -2.56512451171875, -2.4993896484375, -2.43365478515625, -2.367919921875, -2.30218505859375, -2.2364501953125, -2.17071533203125, -2.10498046875, -2.03924560546875, -1.9735107421875, -1.90777587890625, -1.842041015625, -1.77630615234375, -1.7105712890625, -1.64483642578125, -1.5791015625, -1.51336669921875, -1.4476318359375, -1.38189697265625, -1.316162109375, -1.25042724609375, -1.1846923828125, -1.11895751953125, -1.05322265625, -0.98748779296875, -0.9217529296875, -0.85601806640625, -0.790283203125, -0.72454833984375, -0.6588134765625, -0.59307861328125, -0.52734375, -0.46160888671875, -0.3958740234375, -0.33013916015625, -0.264404296875, -0.19866943359375, -0.1329345703125, -0.06719970703125, -0.00146484375, 0.06427001953125, 0.1300048828125, 0.19573974609375, 0.261474609375, 0.32720947265625, 0.3929443359375, 0.45867919921875, 0.5244140625, 0.59014892578125, 0.6558837890625, 0.72161865234375, 0.787353515625, 0.85308837890625, 0.9188232421875, 0.98455810546875, 1.05029296875, 1.11602783203125, 1.1817626953125, 1.24749755859375, 1.313232421875, 1.37896728515625, 1.4447021484375, 1.51043701171875, 1.576171875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 25.0, 144.0, 410.0, 295.0, 86.0, 24.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.44594955444336, -27.330509185791016, -26.215070724487305, -25.099632263183594, -23.98419189453125, -22.868751525878906, -21.753313064575195, -20.637874603271484, -19.52243423461914, -18.406993865966797, -17.291555404663086, -16.176116943359375, -15.060676574707031, -13.945237159729004, -12.829797744750977, -11.71435832977295, -10.598918914794922, -9.483479499816895, -8.368040084838867, -7.25260066986084, -6.1371612548828125, -5.021721839904785, -3.906282424926758, -2.7908430099487305, -1.6754035949707031, -0.5599641799926758, 0.5554752349853516, 1.670914649963379, 2.7863540649414062, 3.9017934799194336, 5.017232894897461, 6.132672309875488, 7.24810791015625, 8.363547325134277, 9.478986740112305, 10.594426155090332, 11.70986557006836, 12.825304985046387, 13.940744400024414, 15.056183815002441, 16.17162322998047, 17.287063598632812, 18.402502059936523, 19.517940521240234, 20.633380889892578, 21.748821258544922, 22.864259719848633, 23.979698181152344, 25.095138549804688, 26.21057891845703, 27.326017379760742, 28.441455841064453, 29.556896209716797, 30.67233657836914, 31.78777503967285, 32.90321350097656, 34.018653869628906, 35.13409423828125, 36.249534606933594, 37.36497116088867, 38.480411529541016, 39.59585189819336, 40.71128845214844, 41.82672882080078, 42.942169189453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 12.0, 11.0, 16.0, 31.0, 43.0, 37.0, 40.0, 43.0, 51.0, 77.0, 53.0, 66.0, 48.0, 66.0, 47.0, 45.0, 41.0, 36.0, 35.0, 33.0, 28.0, 28.0, 16.0, 14.0, 13.0, 11.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-11.73771858215332, -11.449079513549805, -11.160440444946289, -10.871801376342773, -10.583162307739258, -10.294523239135742, -10.005884170532227, -9.717246055603027, -9.428606986999512, -9.139967918395996, -8.85132884979248, -8.562689781188965, -8.27405071258545, -7.985412120819092, -7.696773052215576, -7.408134460449219, -7.119494915008545, -6.830855846405029, -6.542216777801514, -6.253578186035156, -5.964939117431641, -5.676300048828125, -5.387660980224609, -5.099021911621094, -4.810382843017578, -4.5217437744140625, -4.233104705810547, -3.9444658756256104, -3.655827045440674, -3.367187976837158, -3.0785489082336426, -2.789910078048706, -2.5012712478637695, -2.212632179260254, -1.9239933490753174, -1.6353542804718018, -1.3467153310775757, -1.0580763816833496, -0.769437313079834, -0.48079848289489746, -0.19215941429138184, 0.09647956490516663, 0.3851185441017151, 0.6737575531005859, 0.962396502494812, 1.251035451889038, 1.5396745204925537, 1.8283133506774902, 2.116952419281006, 2.4055914878845215, 2.694230318069458, 2.9828693866729736, 3.27150821685791, 3.560147285461426, 3.8487863540649414, 4.137425422668457, 4.426064491271973, 4.714703559875488, 5.003342628479004, 5.2919816970825195, 5.580620288848877, 5.869259357452393, 6.157898426055908, 6.446537017822266, 6.735176086425781]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 10.0, 7.0, 8.0, 14.0, 15.0, 17.0, 37.0, 56.0, 97.0, 180.0, 217.0, 416.0, 927.0, 2127.0, 5582.0, 19696.0, 87092.0, 396062.0, 412371.0, 92575.0, 20870.0, 5937.0, 2192.0, 937.0, 457.0, 253.0, 149.0, 71.0, 63.0, 32.0, 25.0, 21.0, 10.0, 9.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.8984375, -5.73468017578125, -5.5709228515625, -5.40716552734375, -5.243408203125, -5.07965087890625, -4.9158935546875, -4.75213623046875, -4.58837890625, -4.42462158203125, -4.2608642578125, -4.09710693359375, -3.933349609375, -3.76959228515625, -3.6058349609375, -3.44207763671875, -3.2783203125, -3.11456298828125, -2.9508056640625, -2.78704833984375, -2.623291015625, -2.45953369140625, -2.2957763671875, -2.13201904296875, -1.96826171875, -1.80450439453125, -1.6407470703125, -1.47698974609375, -1.313232421875, -1.14947509765625, -0.9857177734375, -0.82196044921875, -0.658203125, -0.49444580078125, -0.3306884765625, -0.16693115234375, -0.003173828125, 0.16058349609375, 0.3243408203125, 0.48809814453125, 0.65185546875, 0.81561279296875, 0.9793701171875, 1.14312744140625, 1.306884765625, 1.47064208984375, 1.6343994140625, 1.79815673828125, 1.9619140625, 2.12567138671875, 2.2894287109375, 2.45318603515625, 2.616943359375, 2.78070068359375, 2.9444580078125, 3.10821533203125, 3.27197265625, 3.43572998046875, 3.5994873046875, 3.76324462890625, 3.927001953125, 4.09075927734375, 4.2545166015625, 4.41827392578125, 4.58203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 5.0, 6.0, 11.0, 19.0, 18.0, 22.0, 23.0, 33.0, 57.0, 59.0, 57.0, 68.0, 74.0, 70.0, 81.0, 71.0, 53.0, 58.0, 46.0, 39.0, 26.0, 32.0, 25.0, 17.0, 12.0, 6.0, 8.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.99578857421875, -1.9427490234375, -1.88970947265625, -1.836669921875, -1.78363037109375, -1.7305908203125, -1.67755126953125, -1.62451171875, -1.57147216796875, -1.5184326171875, -1.46539306640625, -1.412353515625, -1.35931396484375, -1.3062744140625, -1.25323486328125, -1.2001953125, -1.14715576171875, -1.0941162109375, -1.04107666015625, -0.988037109375, -0.93499755859375, -0.8819580078125, -0.82891845703125, -0.77587890625, -0.72283935546875, -0.6697998046875, -0.61676025390625, -0.563720703125, -0.51068115234375, -0.4576416015625, -0.40460205078125, -0.3515625, -0.29852294921875, -0.2454833984375, -0.19244384765625, -0.139404296875, -0.08636474609375, -0.0333251953125, 0.01971435546875, 0.07275390625, 0.12579345703125, 0.1788330078125, 0.23187255859375, 0.284912109375, 0.33795166015625, 0.3909912109375, 0.44403076171875, 0.4970703125, 0.55010986328125, 0.6031494140625, 0.65618896484375, 0.709228515625, 0.76226806640625, 0.8153076171875, 0.86834716796875, 0.92138671875, 0.97442626953125, 1.0274658203125, 1.08050537109375, 1.133544921875, 1.18658447265625, 1.2396240234375, 1.29266357421875, 1.345703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 8.0, 1.0, 3.0, 8.0, 11.0, 8.0, 13.0, 16.0, 17.0, 41.0, 51.0, 68.0, 116.0, 205.0, 406.0, 742.0, 1670.0, 4147.0, 11935.0, 43059.0, 197930.0, 535032.0, 192162.0, 41792.0, 11754.0, 4077.0, 1628.0, 687.0, 372.0, 201.0, 122.0, 85.0, 49.0, 41.0, 19.0, 17.0, 14.0, 13.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.04638671875, -3.9091796875, -3.77197265625, -3.634765625, -3.49755859375, -3.3603515625, -3.22314453125, -3.0859375, -2.94873046875, -2.8115234375, -2.67431640625, -2.537109375, -2.39990234375, -2.2626953125, -2.12548828125, -1.98828125, -1.85107421875, -1.7138671875, -1.57666015625, -1.439453125, -1.30224609375, -1.1650390625, -1.02783203125, -0.890625, -0.75341796875, -0.6162109375, -0.47900390625, -0.341796875, -0.20458984375, -0.0673828125, 0.06982421875, 0.20703125, 0.34423828125, 0.4814453125, 0.61865234375, 0.755859375, 0.89306640625, 1.0302734375, 1.16748046875, 1.3046875, 1.44189453125, 1.5791015625, 1.71630859375, 1.853515625, 1.99072265625, 2.1279296875, 2.26513671875, 2.40234375, 2.53955078125, 2.6767578125, 2.81396484375, 2.951171875, 3.08837890625, 3.2255859375, 3.36279296875, 3.5, 3.63720703125, 3.7744140625, 3.91162109375, 4.048828125, 4.18603515625, 4.3232421875, 4.46044921875, 4.59765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 8.0, 6.0, 5.0, 11.0, 15.0, 18.0, 18.0, 17.0, 21.0, 24.0, 35.0, 28.0, 41.0, 50.0, 30.0, 50.0, 56.0, 53.0, 57.0, 55.0, 51.0, 52.0, 50.0, 43.0, 33.0, 24.0, 32.0, 24.0, 22.0, 12.0, 14.0, 9.0, 9.0, 7.0, 0.0, 7.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.3359375, -7.12139892578125, -6.9068603515625, -6.69232177734375, -6.477783203125, -6.26324462890625, -6.0487060546875, -5.83416748046875, -5.61962890625, -5.40509033203125, -5.1905517578125, -4.97601318359375, -4.761474609375, -4.54693603515625, -4.3323974609375, -4.11785888671875, -3.9033203125, -3.68878173828125, -3.4742431640625, -3.25970458984375, -3.045166015625, -2.83062744140625, -2.6160888671875, -2.40155029296875, -2.18701171875, -1.97247314453125, -1.7579345703125, -1.54339599609375, -1.328857421875, -1.11431884765625, -0.8997802734375, -0.68524169921875, -0.470703125, -0.25616455078125, -0.0416259765625, 0.17291259765625, 0.387451171875, 0.60198974609375, 0.8165283203125, 1.03106689453125, 1.24560546875, 1.46014404296875, 1.6746826171875, 1.88922119140625, 2.103759765625, 2.31829833984375, 2.5328369140625, 2.74737548828125, 2.9619140625, 3.17645263671875, 3.3909912109375, 3.60552978515625, 3.820068359375, 4.03460693359375, 4.2491455078125, 4.46368408203125, 4.67822265625, 4.89276123046875, 5.1072998046875, 5.32183837890625, 5.536376953125, 5.75091552734375, 5.9654541015625, 6.17999267578125, 6.39453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 9.0, 15.0, 21.0, 24.0, 26.0, 42.0, 64.0, 98.0, 187.0, 268.0, 523.0, 1167.0, 3032.0, 9397.0, 42616.0, 351901.0, 549174.0, 69702.0, 13322.0, 3989.0, 1463.0, 665.0, 322.0, 195.0, 99.0, 75.0, 44.0, 30.0, 25.0, 15.0, 7.0, 12.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.265625, -2.1904296875, -2.115234375, -2.0400390625, -1.96484375, -1.8896484375, -1.814453125, -1.7392578125, -1.6640625, -1.5888671875, -1.513671875, -1.4384765625, -1.36328125, -1.2880859375, -1.212890625, -1.1376953125, -1.0625, -0.9873046875, -0.912109375, -0.8369140625, -0.76171875, -0.6865234375, -0.611328125, -0.5361328125, -0.4609375, -0.3857421875, -0.310546875, -0.2353515625, -0.16015625, -0.0849609375, -0.009765625, 0.0654296875, 0.140625, 0.2158203125, 0.291015625, 0.3662109375, 0.44140625, 0.5166015625, 0.591796875, 0.6669921875, 0.7421875, 0.8173828125, 0.892578125, 0.9677734375, 1.04296875, 1.1181640625, 1.193359375, 1.2685546875, 1.34375, 1.4189453125, 1.494140625, 1.5693359375, 1.64453125, 1.7197265625, 1.794921875, 1.8701171875, 1.9453125, 2.0205078125, 2.095703125, 2.1708984375, 2.24609375, 2.3212890625, 2.396484375, 2.4716796875, 2.546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 12.0, 5.0, 18.0, 25.0, 40.0, 51.0, 51.0, 106.0, 124.0, 117.0, 111.0, 88.0, 74.0, 58.0, 40.0, 29.0, 9.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003104209899902344, -0.0002987682819366455, -0.00028711557388305664, -0.0002754628658294678, -0.0002638101577758789, -0.00025215744972229004, -0.00024050474166870117, -0.0002288520336151123, -0.00021719932556152344, -0.00020554661750793457, -0.0001938939094543457, -0.00018224120140075684, -0.00017058849334716797, -0.0001589357852935791, -0.00014728307723999023, -0.00013563036918640137, -0.0001239776611328125, -0.00011232495307922363, -0.00010067224502563477, -8.90195369720459e-05, -7.736682891845703e-05, -6.571412086486816e-05, -5.40614128112793e-05, -4.240870475769043e-05, -3.075599670410156e-05, -1.9103288650512695e-05, -7.450580596923828e-06, 4.202127456665039e-06, 1.5854835510253906e-05, 2.7507543563842773e-05, 3.916025161743164e-05, 5.081295967102051e-05, 6.246566772460938e-05, 7.411837577819824e-05, 8.577108383178711e-05, 9.742379188537598e-05, 0.00010907649993896484, 0.00012072920799255371, 0.00013238191604614258, 0.00014403462409973145, 0.0001556873321533203, 0.00016734004020690918, 0.00017899274826049805, 0.00019064545631408691, 0.00020229816436767578, 0.00021395087242126465, 0.00022560358047485352, 0.00023725628852844238, 0.00024890899658203125, 0.0002605617046356201, 0.000272214412689209, 0.00028386712074279785, 0.0002955198287963867, 0.0003071725368499756, 0.00031882524490356445, 0.0003304779529571533, 0.0003421306610107422, 0.00035378336906433105, 0.0003654360771179199, 0.0003770887851715088, 0.00038874149322509766, 0.0004003942012786865, 0.0004120469093322754, 0.00042369961738586426, 0.0004353523254394531]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 6.0, 9.0, 6.0, 28.0, 20.0, 59.0, 72.0, 72.0, 148.0, 220.0, 378.0, 653.0, 1270.0, 2626.0, 6430.0, 19761.0, 81436.0, 353747.0, 433874.0, 108305.0, 25332.0, 7790.0, 3013.0, 1451.0, 738.0, 389.0, 236.0, 143.0, 99.0, 62.0, 43.0, 38.0, 20.0, 21.0, 13.0, 6.0, 5.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.671875, -1.619781494140625, -1.56768798828125, -1.515594482421875, -1.4635009765625, -1.411407470703125, -1.35931396484375, -1.307220458984375, -1.255126953125, -1.203033447265625, -1.15093994140625, -1.098846435546875, -1.0467529296875, -0.994659423828125, -0.94256591796875, -0.890472412109375, -0.83837890625, -0.786285400390625, -0.73419189453125, -0.682098388671875, -0.6300048828125, -0.577911376953125, -0.52581787109375, -0.473724365234375, -0.421630859375, -0.369537353515625, -0.31744384765625, -0.265350341796875, -0.2132568359375, -0.161163330078125, -0.10906982421875, -0.056976318359375, -0.0048828125, 0.047210693359375, 0.09930419921875, 0.151397705078125, 0.2034912109375, 0.255584716796875, 0.30767822265625, 0.359771728515625, 0.411865234375, 0.463958740234375, 0.51605224609375, 0.568145751953125, 0.6202392578125, 0.672332763671875, 0.72442626953125, 0.776519775390625, 0.82861328125, 0.880706787109375, 0.93280029296875, 0.984893798828125, 1.0369873046875, 1.089080810546875, 1.14117431640625, 1.193267822265625, 1.245361328125, 1.297454833984375, 1.34954833984375, 1.401641845703125, 1.4537353515625, 1.505828857421875, 1.55792236328125, 1.610015869140625, 1.662109375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 0.0, 9.0, 5.0, 14.0, 18.0, 31.0, 34.0, 52.0, 62.0, 84.0, 92.0, 128.0, 110.0, 111.0, 68.0, 55.0, 41.0, 28.0, 11.0, 10.0, 7.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4375, -2.352203369140625, -2.26690673828125, -2.181610107421875, -2.0963134765625, -2.011016845703125, -1.92572021484375, -1.840423583984375, -1.755126953125, -1.669830322265625, -1.58453369140625, -1.499237060546875, -1.4139404296875, -1.328643798828125, -1.24334716796875, -1.158050537109375, -1.07275390625, -0.987457275390625, -0.90216064453125, -0.816864013671875, -0.7315673828125, -0.646270751953125, -0.56097412109375, -0.475677490234375, -0.390380859375, -0.305084228515625, -0.21978759765625, -0.134490966796875, -0.0491943359375, 0.036102294921875, 0.12139892578125, 0.206695556640625, 0.2919921875, 0.377288818359375, 0.46258544921875, 0.547882080078125, 0.6331787109375, 0.718475341796875, 0.80377197265625, 0.889068603515625, 0.974365234375, 1.059661865234375, 1.14495849609375, 1.230255126953125, 1.3155517578125, 1.400848388671875, 1.48614501953125, 1.571441650390625, 1.65673828125, 1.742034912109375, 1.82733154296875, 1.912628173828125, 1.9979248046875, 2.083221435546875, 2.16851806640625, 2.253814697265625, 2.339111328125, 2.424407958984375, 2.50970458984375, 2.595001220703125, 2.6802978515625, 2.765594482421875, 2.85089111328125, 2.936187744140625, 3.021484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 14.0, 28.0, 151.0, 348.0, 330.0, 103.0, 29.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-182.0247039794922, -178.7698516845703, -175.51498413085938, -172.2601318359375, -169.00527954101562, -165.7504119873047, -162.4955596923828, -159.24070739746094, -155.98583984375, -152.73098754882812, -149.4761199951172, -146.2212677001953, -142.96641540527344, -139.7115478515625, -136.45669555664062, -133.20184326171875, -129.94699096679688, -126.69213104248047, -123.4372787475586, -120.18241882324219, -116.92755889892578, -113.6727066040039, -110.4178466796875, -107.16299438476562, -103.90812683105469, -100.65326690673828, -97.3984146118164, -94.1435546875, -90.8886947631836, -87.63384246826172, -84.37898254394531, -81.12413024902344, -77.8692626953125, -74.6144027709961, -71.35955047607422, -68.10469055175781, -64.8498306274414, -61.59497833251953, -58.340118408203125, -55.085262298583984, -51.830406188964844, -48.5755500793457, -45.3206901550293, -42.065834045410156, -38.810977935791016, -35.556121826171875, -32.30126190185547, -29.046405792236328, -25.791547775268555, -22.53668975830078, -19.28183364868164, -16.026975631713867, -12.77211856842041, -9.517261505126953, -6.26240348815918, -3.007547378540039, 0.24731063842773438, 3.5021679401397705, 6.757025241851807, 10.011882781982422, 13.266739845275879, 16.521596908569336, 19.77645492553711, 23.03131103515625, 26.286169052124023]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 13.0, 8.0, 15.0, 18.0, 25.0, 21.0, 38.0, 44.0, 40.0, 45.0, 53.0, 51.0, 52.0, 50.0, 59.0, 58.0, 45.0, 52.0, 49.0, 45.0, 34.0, 33.0, 20.0, 25.0, 15.0, 12.0, 13.0, 12.0, 9.0, 6.0, 9.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.51097106933594, -39.196617126464844, -37.88226318359375, -36.56790542602539, -35.2535514831543, -33.9391975402832, -32.62484359741211, -31.310489654541016, -29.99613380432129, -28.681779861450195, -27.36742401123047, -26.053070068359375, -24.73871612548828, -23.424360275268555, -22.11000633239746, -20.795650482177734, -19.48129653930664, -18.166942596435547, -16.85258674621582, -15.538232803344727, -14.223877906799316, -12.909523010253906, -11.595169067382812, -10.280814170837402, -8.966459274291992, -7.652104377746582, -6.33774995803833, -5.023395538330078, -3.709040641784668, -2.394685745239258, -1.0803313255310059, 0.2340230941772461, 1.5483779907226562, 2.8627326488494873, 4.177087306976318, 5.49144172668457, 6.8057966232299805, 8.12015151977539, 9.434505462646484, 10.748860359191895, 12.063215255737305, 13.377570152282715, 14.691925048828125, 16.00627899169922, 17.320632934570312, 18.63498878479004, 19.949342727661133, 21.26369857788086, 22.578052520751953, 23.892406463623047, 25.206762313842773, 26.521116256713867, 27.835472106933594, 29.149826049804688, 30.46417999267578, 31.778533935546875, 33.09288787841797, 34.40724182128906, 35.721595764160156, 37.035953521728516, 38.35030746459961, 39.6646614074707, 40.9790153503418, 42.29336929321289, 43.60772705078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 6.0, 3.0, 4.0, 12.0, 23.0, 20.0, 28.0, 55.0, 78.0, 174.0, 273.0, 587.0, 1568.0, 4684.0, 21416.0, 4036986.0, 112457.0, 10980.0, 2911.0, 1039.0, 474.0, 212.0, 111.0, 66.0, 41.0, 21.0, 9.0, 13.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.734375, -11.4239501953125, -11.113525390625, -10.8031005859375, -10.49267578125, -10.1822509765625, -9.871826171875, -9.5614013671875, -9.2509765625, -8.9405517578125, -8.630126953125, -8.3197021484375, -8.00927734375, -7.6988525390625, -7.388427734375, -7.0780029296875, -6.767578125, -6.4571533203125, -6.146728515625, -5.8363037109375, -5.52587890625, -5.2154541015625, -4.905029296875, -4.5946044921875, -4.2841796875, -3.9737548828125, -3.663330078125, -3.3529052734375, -3.04248046875, -2.7320556640625, -2.421630859375, -2.1112060546875, -1.80078125, -1.4903564453125, -1.179931640625, -0.8695068359375, -0.55908203125, -0.2486572265625, 0.061767578125, 0.3721923828125, 0.6826171875, 0.9930419921875, 1.303466796875, 1.6138916015625, 1.92431640625, 2.2347412109375, 2.545166015625, 2.8555908203125, 3.166015625, 3.4764404296875, 3.786865234375, 4.0972900390625, 4.40771484375, 4.7181396484375, 5.028564453125, 5.3389892578125, 5.6494140625, 5.9598388671875, 6.270263671875, 6.5806884765625, 6.89111328125, 7.2015380859375, 7.511962890625, 7.8223876953125, 8.1328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 8.0, 8.0, 17.0, 20.0, 15.0, 26.0, 27.0, 39.0, 31.0, 55.0, 55.0, 55.0, 51.0, 41.0, 54.0, 57.0, 33.0, 42.0, 57.0, 48.0, 47.0, 34.0, 33.0, 19.0, 26.0, 19.0, 24.0, 4.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.021484375, -1.9661102294921875, -1.910736083984375, -1.8553619384765625, -1.79998779296875, -1.7446136474609375, -1.689239501953125, -1.6338653564453125, -1.5784912109375, -1.5231170654296875, -1.467742919921875, -1.4123687744140625, -1.35699462890625, -1.3016204833984375, -1.246246337890625, -1.1908721923828125, -1.135498046875, -1.0801239013671875, -1.024749755859375, -0.9693756103515625, -0.91400146484375, -0.8586273193359375, -0.803253173828125, -0.7478790283203125, -0.6925048828125, -0.6371307373046875, -0.581756591796875, -0.5263824462890625, -0.47100830078125, -0.4156341552734375, -0.360260009765625, -0.3048858642578125, -0.24951171875, -0.1941375732421875, -0.138763427734375, -0.0833892822265625, -0.02801513671875, 0.0273590087890625, 0.082733154296875, 0.1381072998046875, 0.1934814453125, 0.2488555908203125, 0.304229736328125, 0.3596038818359375, 0.41497802734375, 0.4703521728515625, 0.525726318359375, 0.5811004638671875, 0.636474609375, 0.6918487548828125, 0.747222900390625, 0.8025970458984375, 0.85797119140625, 0.9133453369140625, 0.968719482421875, 1.0240936279296875, 1.0794677734375, 1.1348419189453125, 1.190216064453125, 1.2455902099609375, 1.30096435546875, 1.3563385009765625, 1.411712646484375, 1.4670867919921875, 1.5224609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 2.0, 8.0, 20.0, 29.0, 36.0, 51.0, 74.0, 107.0, 179.0, 251.0, 403.0, 590.0, 980.0, 1685.0, 3300.0, 7583.0, 21100.0, 107061.0, 3931740.0, 86680.0, 18406.0, 6771.0, 2916.0, 1579.0, 948.0, 565.0, 389.0, 260.0, 156.0, 113.0, 79.0, 68.0, 40.0, 24.0, 26.0, 14.0, 8.0, 6.0, 10.0, 7.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.96875, -4.80560302734375, -4.6424560546875, -4.47930908203125, -4.316162109375, -4.15301513671875, -3.9898681640625, -3.82672119140625, -3.66357421875, -3.50042724609375, -3.3372802734375, -3.17413330078125, -3.010986328125, -2.84783935546875, -2.6846923828125, -2.52154541015625, -2.3583984375, -2.19525146484375, -2.0321044921875, -1.86895751953125, -1.705810546875, -1.54266357421875, -1.3795166015625, -1.21636962890625, -1.05322265625, -0.89007568359375, -0.7269287109375, -0.56378173828125, -0.400634765625, -0.23748779296875, -0.0743408203125, 0.08880615234375, 0.251953125, 0.41510009765625, 0.5782470703125, 0.74139404296875, 0.904541015625, 1.06768798828125, 1.2308349609375, 1.39398193359375, 1.55712890625, 1.72027587890625, 1.8834228515625, 2.04656982421875, 2.209716796875, 2.37286376953125, 2.5360107421875, 2.69915771484375, 2.8623046875, 3.02545166015625, 3.1885986328125, 3.35174560546875, 3.514892578125, 3.67803955078125, 3.8411865234375, 4.00433349609375, 4.16748046875, 4.33062744140625, 4.4937744140625, 4.65692138671875, 4.820068359375, 4.98321533203125, 5.1463623046875, 5.30950927734375, 5.47265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 13.0, 13.0, 20.0, 27.0, 46.0, 104.0, 617.0, 3016.0, 100.0, 50.0, 22.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1728057861328125, -1.121978759765625, -1.0711517333984375, -1.02032470703125, -0.9694976806640625, -0.918670654296875, -0.8678436279296875, -0.8170166015625, -0.7661895751953125, -0.715362548828125, -0.6645355224609375, -0.61370849609375, -0.5628814697265625, -0.512054443359375, -0.4612274169921875, -0.410400390625, -0.3595733642578125, -0.308746337890625, -0.2579193115234375, -0.20709228515625, -0.1562652587890625, -0.105438232421875, -0.0546112060546875, -0.0037841796875, 0.0470428466796875, 0.097869873046875, 0.1486968994140625, 0.19952392578125, 0.2503509521484375, 0.301177978515625, 0.3520050048828125, 0.40283203125, 0.4536590576171875, 0.504486083984375, 0.5553131103515625, 0.60614013671875, 0.6569671630859375, 0.707794189453125, 0.7586212158203125, 0.8094482421875, 0.8602752685546875, 0.911102294921875, 0.9619293212890625, 1.01275634765625, 1.0635833740234375, 1.114410400390625, 1.1652374267578125, 1.216064453125, 1.2668914794921875, 1.317718505859375, 1.3685455322265625, 1.41937255859375, 1.4701995849609375, 1.521026611328125, 1.5718536376953125, 1.6226806640625, 1.6735076904296875, 1.724334716796875, 1.7751617431640625, 1.82598876953125, 1.8768157958984375, 1.927642822265625, 1.9784698486328125, 2.029296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 8.0, 12.0, 27.0, 45.0, 97.0, 165.0, 239.0, 198.0, 137.0, 63.0, 9.0, 7.0, 3.0, 2.0], "bins": [-15.506940841674805, -15.235616683959961, -14.9642915725708, -14.69296646118164, -14.421642303466797, -14.150318145751953, -13.878993034362793, -13.607667922973633, -13.336343765258789, -13.065019607543945, -12.793694496154785, -12.522369384765625, -12.251045227050781, -11.979721069335938, -11.708395957946777, -11.437070846557617, -11.165746688842773, -10.89442253112793, -10.62309741973877, -10.35177230834961, -10.080448150634766, -9.809123992919922, -9.537798881530762, -9.266473770141602, -8.995149612426758, -8.723825454711914, -8.452500343322754, -8.181175231933594, -7.90985107421875, -7.638526439666748, -7.367201805114746, -7.095877170562744, -6.824552059173584, -6.553227424621582, -6.28190279006958, -6.010578155517578, -5.739253520965576, -5.467928886413574, -5.196604251861572, -4.92527961730957, -4.653954982757568, -4.382630348205566, -4.1113057136535645, -3.8399810791015625, -3.5686564445495605, -3.2973318099975586, -3.0260071754455566, -2.7546825408935547, -2.4833579063415527, -2.212033271789551, -1.9407086372375488, -1.6693840026855469, -1.398059368133545, -1.126734733581543, -0.855410099029541, -0.5840854644775391, -0.3127608299255371, -0.041436195373535156, 0.2298884391784668, 0.5012130737304688, 0.7725377082824707, 1.0438623428344727, 1.3151869773864746, 1.5865116119384766, 1.8578362464904785]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 7.0, 8.0, 15.0, 16.0, 15.0, 22.0, 27.0, 25.0, 22.0, 32.0, 30.0, 36.0, 28.0, 29.0, 38.0, 31.0, 29.0, 31.0, 42.0, 45.0, 31.0, 41.0, 42.0, 42.0, 42.0, 28.0, 26.0, 35.0, 19.0, 20.0, 11.0, 20.0, 22.0, 12.0, 13.0, 8.0, 7.0, 8.0, 7.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.7228174209594727, -2.630297899246216, -2.537778377532959, -2.4452590942382812, -2.3527395725250244, -2.2602200508117676, -2.1677005290985107, -2.075181007385254, -1.9826616048812866, -1.8901420831680298, -1.7976226806640625, -1.7051031589508057, -1.6125836372375488, -1.5200642347335815, -1.4275447130203247, -1.3350253105163574, -1.2425057888031006, -1.1499862670898438, -1.0574668645858765, -0.9649473428726196, -0.8724278807640076, -0.7799084186553955, -0.6873888969421387, -0.5948694348335266, -0.5023499727249146, -0.4098305106163025, -0.31731101870536804, -0.2247915267944336, -0.13227206468582153, -0.03975260257720947, 0.05276691913604736, 0.14528638124465942, 0.23780584335327148, 0.33032530546188354, 0.422844797372818, 0.5153642892837524, 0.6078837513923645, 0.7004032135009766, 0.7929227352142334, 0.8854421973228455, 0.9779616594314575, 1.0704811811447144, 1.1630005836486816, 1.2555201053619385, 1.3480396270751953, 1.4405590295791626, 1.5330785512924194, 1.6255979537963867, 1.7181174755096436, 1.8106369972229004, 1.9031563997268677, 1.9956759214401245, 2.088195323944092, 2.1807148456573486, 2.2732343673706055, 2.3657538890838623, 2.458273410797119, 2.550792932510376, 2.643312454223633, 2.7358317375183105, 2.8283512592315674, 2.920870780944824, 3.013390302658081, 3.105909824371338, 3.1984291076660156]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 12.0, 13.0, 26.0, 30.0, 59.0, 99.0, 198.0, 488.0, 1133.0, 3154.0, 10739.0, 43677.0, 200392.0, 506163.0, 217457.0, 47675.0, 11597.0, 3460.0, 1225.0, 474.0, 204.0, 120.0, 55.0, 42.0, 20.0, 11.0, 9.0, 6.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -3.96429443359375, -3.7801513671875, -3.59600830078125, -3.411865234375, -3.22772216796875, -3.0435791015625, -2.85943603515625, -2.67529296875, -2.49114990234375, -2.3070068359375, -2.12286376953125, -1.938720703125, -1.75457763671875, -1.5704345703125, -1.38629150390625, -1.2021484375, -1.01800537109375, -0.8338623046875, -0.64971923828125, -0.465576171875, -0.28143310546875, -0.0972900390625, 0.08685302734375, 0.27099609375, 0.45513916015625, 0.6392822265625, 0.82342529296875, 1.007568359375, 1.19171142578125, 1.3758544921875, 1.55999755859375, 1.744140625, 1.92828369140625, 2.1124267578125, 2.29656982421875, 2.480712890625, 2.66485595703125, 2.8489990234375, 3.03314208984375, 3.21728515625, 3.40142822265625, 3.5855712890625, 3.76971435546875, 3.953857421875, 4.13800048828125, 4.3221435546875, 4.50628662109375, 4.6904296875, 4.87457275390625, 5.0587158203125, 5.24285888671875, 5.427001953125, 5.61114501953125, 5.7952880859375, 5.97943115234375, 6.16357421875, 6.34771728515625, 6.5318603515625, 6.71600341796875, 6.900146484375, 7.08428955078125, 7.2684326171875, 7.45257568359375, 7.63671875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 4.0, 9.0, 13.0, 16.0, 12.0, 23.0, 18.0, 26.0, 40.0, 43.0, 44.0, 41.0, 45.0, 55.0, 52.0, 51.0, 59.0, 43.0, 43.0, 54.0, 43.0, 37.0, 36.0, 36.0, 26.0, 29.0, 19.0, 18.0, 10.0, 9.0, 8.0, 8.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.97845458984375, -1.9197998046875, -1.86114501953125, -1.802490234375, -1.74383544921875, -1.6851806640625, -1.62652587890625, -1.56787109375, -1.50921630859375, -1.4505615234375, -1.39190673828125, -1.333251953125, -1.27459716796875, -1.2159423828125, -1.15728759765625, -1.0986328125, -1.03997802734375, -0.9813232421875, -0.92266845703125, -0.864013671875, -0.80535888671875, -0.7467041015625, -0.68804931640625, -0.62939453125, -0.57073974609375, -0.5120849609375, -0.45343017578125, -0.394775390625, -0.33612060546875, -0.2774658203125, -0.21881103515625, -0.16015625, -0.10150146484375, -0.0428466796875, 0.01580810546875, 0.074462890625, 0.13311767578125, 0.1917724609375, 0.25042724609375, 0.30908203125, 0.36773681640625, 0.4263916015625, 0.48504638671875, 0.543701171875, 0.60235595703125, 0.6610107421875, 0.71966552734375, 0.7783203125, 0.83697509765625, 0.8956298828125, 0.95428466796875, 1.012939453125, 1.07159423828125, 1.1302490234375, 1.18890380859375, 1.24755859375, 1.30621337890625, 1.3648681640625, 1.42352294921875, 1.482177734375, 1.54083251953125, 1.5994873046875, 1.65814208984375, 1.716796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 9.0, 14.0, 14.0, 28.0, 26.0, 46.0, 73.0, 73.0, 149.0, 249.0, 471.0, 1070.0, 2916.0, 10023.0, 50844.0, 348329.0, 531400.0, 81313.0, 14841.0, 3900.0, 1346.0, 563.0, 301.0, 188.0, 108.0, 71.0, 55.0, 43.0, 24.0, 19.0, 10.0, 4.0, 7.0, 4.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.56341552734375, -6.3455810546875, -6.12774658203125, -5.909912109375, -5.69207763671875, -5.4742431640625, -5.25640869140625, -5.03857421875, -4.82073974609375, -4.6029052734375, -4.38507080078125, -4.167236328125, -3.94940185546875, -3.7315673828125, -3.51373291015625, -3.2958984375, -3.07806396484375, -2.8602294921875, -2.64239501953125, -2.424560546875, -2.20672607421875, -1.9888916015625, -1.77105712890625, -1.55322265625, -1.33538818359375, -1.1175537109375, -0.89971923828125, -0.681884765625, -0.46405029296875, -0.2462158203125, -0.02838134765625, 0.189453125, 0.40728759765625, 0.6251220703125, 0.84295654296875, 1.060791015625, 1.27862548828125, 1.4964599609375, 1.71429443359375, 1.93212890625, 2.14996337890625, 2.3677978515625, 2.58563232421875, 2.803466796875, 3.02130126953125, 3.2391357421875, 3.45697021484375, 3.6748046875, 3.89263916015625, 4.1104736328125, 4.32830810546875, 4.546142578125, 4.76397705078125, 4.9818115234375, 5.19964599609375, 5.41748046875, 5.63531494140625, 5.8531494140625, 6.07098388671875, 6.288818359375, 6.50665283203125, 6.7244873046875, 6.94232177734375, 7.16015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 9.0, 16.0, 20.0, 30.0, 37.0, 50.0, 37.0, 59.0, 50.0, 68.0, 63.0, 83.0, 80.0, 61.0, 66.0, 53.0, 51.0, 34.0, 24.0, 29.0, 25.0, 9.0, 9.0, 7.0, 5.0, 5.0, 3.0, 1.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -8.963623046875, -8.50537109375, -8.047119140625, -7.5888671875, -7.130615234375, -6.67236328125, -6.214111328125, -5.755859375, -5.297607421875, -4.83935546875, -4.381103515625, -3.9228515625, -3.464599609375, -3.00634765625, -2.548095703125, -2.08984375, -1.631591796875, -1.17333984375, -0.715087890625, -0.2568359375, 0.201416015625, 0.65966796875, 1.117919921875, 1.576171875, 2.034423828125, 2.49267578125, 2.950927734375, 3.4091796875, 3.867431640625, 4.32568359375, 4.783935546875, 5.2421875, 5.700439453125, 6.15869140625, 6.616943359375, 7.0751953125, 7.533447265625, 7.99169921875, 8.449951171875, 8.908203125, 9.366455078125, 9.82470703125, 10.282958984375, 10.7412109375, 11.199462890625, 11.65771484375, 12.115966796875, 12.57421875, 13.032470703125, 13.49072265625, 13.948974609375, 14.4072265625, 14.865478515625, 15.32373046875, 15.781982421875, 16.240234375, 16.698486328125, 17.15673828125, 17.614990234375, 18.0732421875, 18.531494140625, 18.98974609375, 19.447998046875, 19.90625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 9.0, 12.0, 12.0, 40.0, 74.0, 144.0, 375.0, 1302.0, 11043.0, 1007979.0, 24841.0, 1897.0, 470.0, 176.0, 83.0, 42.0, 21.0, 15.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -9.9998779296875, -9.593505859375, -9.1871337890625, -8.78076171875, -8.3743896484375, -7.968017578125, -7.5616455078125, -7.1552734375, -6.7489013671875, -6.342529296875, -5.9361572265625, -5.52978515625, -5.1234130859375, -4.717041015625, -4.3106689453125, -3.904296875, -3.4979248046875, -3.091552734375, -2.6851806640625, -2.27880859375, -1.8724365234375, -1.466064453125, -1.0596923828125, -0.6533203125, -0.2469482421875, 0.159423828125, 0.5657958984375, 0.97216796875, 1.3785400390625, 1.784912109375, 2.1912841796875, 2.59765625, 3.0040283203125, 3.410400390625, 3.8167724609375, 4.22314453125, 4.6295166015625, 5.035888671875, 5.4422607421875, 5.8486328125, 6.2550048828125, 6.661376953125, 7.0677490234375, 7.47412109375, 7.8804931640625, 8.286865234375, 8.6932373046875, 9.099609375, 9.5059814453125, 9.912353515625, 10.3187255859375, 10.72509765625, 11.1314697265625, 11.537841796875, 11.9442138671875, 12.3505859375, 12.7569580078125, 13.163330078125, 13.5697021484375, 13.97607421875, 14.3824462890625, 14.788818359375, 15.1951904296875, 15.6015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 15.0, 17.0, 44.0, 69.0, 87.0, 143.0, 178.0, 172.0, 106.0, 74.0, 32.0, 21.0, 11.0, 9.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007047653198242188, -0.000681854784488678, -0.0006589442491531372, -0.0006360337138175964, -0.0006131231784820557, -0.0005902126431465149, -0.0005673021078109741, -0.0005443915724754333, -0.0005214810371398926, -0.0004985705018043518, -0.00047565996646881104, -0.00045274943113327026, -0.0004298388957977295, -0.0004069283604621887, -0.00038401782512664795, -0.0003611072897911072, -0.0003381967544555664, -0.00031528621912002563, -0.00029237568378448486, -0.0002694651484489441, -0.0002465546131134033, -0.00022364407777786255, -0.00020073354244232178, -0.000177823007106781, -0.00015491247177124023, -0.00013200193643569946, -0.00010909140110015869, -8.618086576461792e-05, -6.327033042907715e-05, -4.035979509353638e-05, -1.7449259757995605e-05, 5.461275577545166e-06, 2.8371810913085938e-05, 5.128234624862671e-05, 7.419288158416748e-05, 9.710341691970825e-05, 0.00012001395225524902, 0.0001429244875907898, 0.00016583502292633057, 0.00018874555826187134, 0.0002116560935974121, 0.00023456662893295288, 0.00025747716426849365, 0.0002803876996040344, 0.0003032982349395752, 0.00032620877027511597, 0.00034911930561065674, 0.0003720298409461975, 0.0003949403762817383, 0.00041785091161727905, 0.0004407614469528198, 0.0004636719822883606, 0.00048658251762390137, 0.0005094930529594421, 0.0005324035882949829, 0.0005553141236305237, 0.0005782246589660645, 0.0006011351943016052, 0.000624045729637146, 0.0006469562649726868, 0.0006698668003082275, 0.0006927773356437683, 0.0007156878709793091, 0.0007385984063148499, 0.0007615089416503906]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 13.0, 14.0, 33.0, 48.0, 116.0, 213.0, 578.0, 1553.0, 5818.0, 56257.0, 898065.0, 76184.0, 6777.0, 1791.0, 634.0, 234.0, 103.0, 54.0, 21.0, 18.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.86328125, -3.6839599609375, -3.504638671875, -3.3253173828125, -3.14599609375, -2.9666748046875, -2.787353515625, -2.6080322265625, -2.4287109375, -2.2493896484375, -2.070068359375, -1.8907470703125, -1.71142578125, -1.5321044921875, -1.352783203125, -1.1734619140625, -0.994140625, -0.8148193359375, -0.635498046875, -0.4561767578125, -0.27685546875, -0.0975341796875, 0.081787109375, 0.2611083984375, 0.4404296875, 0.6197509765625, 0.799072265625, 0.9783935546875, 1.15771484375, 1.3370361328125, 1.516357421875, 1.6956787109375, 1.875, 2.0543212890625, 2.233642578125, 2.4129638671875, 2.59228515625, 2.7716064453125, 2.950927734375, 3.1302490234375, 3.3095703125, 3.4888916015625, 3.668212890625, 3.8475341796875, 4.02685546875, 4.2061767578125, 4.385498046875, 4.5648193359375, 4.744140625, 4.9234619140625, 5.102783203125, 5.2821044921875, 5.46142578125, 5.6407470703125, 5.820068359375, 5.9993896484375, 6.1787109375, 6.3580322265625, 6.537353515625, 6.7166748046875, 6.89599609375, 7.0753173828125, 7.254638671875, 7.4339599609375, 7.61328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 20.0, 33.0, 77.0, 158.0, 245.0, 216.0, 102.0, 68.0, 21.0, 12.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5390625, -8.3128662109375, -8.086669921875, -7.8604736328125, -7.63427734375, -7.4080810546875, -7.181884765625, -6.9556884765625, -6.7294921875, -6.5032958984375, -6.277099609375, -6.0509033203125, -5.82470703125, -5.5985107421875, -5.372314453125, -5.1461181640625, -4.919921875, -4.6937255859375, -4.467529296875, -4.2413330078125, -4.01513671875, -3.7889404296875, -3.562744140625, -3.3365478515625, -3.1103515625, -2.8841552734375, -2.657958984375, -2.4317626953125, -2.20556640625, -1.9793701171875, -1.753173828125, -1.5269775390625, -1.30078125, -1.0745849609375, -0.848388671875, -0.6221923828125, -0.39599609375, -0.1697998046875, 0.056396484375, 0.2825927734375, 0.5087890625, 0.7349853515625, 0.961181640625, 1.1873779296875, 1.41357421875, 1.6397705078125, 1.865966796875, 2.0921630859375, 2.318359375, 2.5445556640625, 2.770751953125, 2.9969482421875, 3.22314453125, 3.4493408203125, 3.675537109375, 3.9017333984375, 4.1279296875, 4.3541259765625, 4.580322265625, 4.8065185546875, 5.03271484375, 5.2589111328125, 5.485107421875, 5.7113037109375, 5.9375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 13.0, 31.0, 65.0, 102.0, 171.0, 206.0, 186.0, 121.0, 52.0, 33.0, 13.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.882904052734375, -61.46776580810547, -59.05262756347656, -56.63749313354492, -54.222354888916016, -51.80721664428711, -49.39208221435547, -46.97694396972656, -44.561805725097656, -42.14666748046875, -39.731529235839844, -37.3163948059082, -34.9012565612793, -32.48611831665039, -30.070981979370117, -27.655845642089844, -25.240707397460938, -22.82556915283203, -20.410432815551758, -17.995296478271484, -15.580158233642578, -13.165020942687988, -10.749883651733398, -8.334747314453125, -5.919609069824219, -3.504471778869629, -1.089334487915039, 1.3258028030395508, 3.7409400939941406, 6.1560773849487305, 8.57121467590332, 10.986351013183594, 13.4014892578125, 15.81662654876709, 18.23176383972168, 20.646900177001953, 23.06203842163086, 25.477176666259766, 27.89231300354004, 30.307449340820312, 32.72258758544922, 35.137725830078125, 37.55286407470703, 39.96799850463867, 42.38313674926758, 44.798274993896484, 47.213409423828125, 49.62854766845703, 52.04368591308594, 54.458824157714844, 56.87396240234375, 59.28909683227539, 61.7042350769043, 64.11936950683594, 66.53450775146484, 68.94964599609375, 71.36478424072266, 73.77992248535156, 76.19506072998047, 78.61019897460938, 81.02532958984375, 83.44046783447266, 85.85560607910156, 88.27074432373047, 90.68588256835938]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 7.0, 8.0, 10.0, 12.0, 16.0, 21.0, 17.0, 16.0, 32.0, 18.0, 42.0, 26.0, 40.0, 49.0, 45.0, 50.0, 62.0, 56.0, 45.0, 72.0, 46.0, 40.0, 43.0, 37.0, 34.0, 28.0, 18.0, 20.0, 9.0, 15.0, 14.0, 9.0, 5.0, 11.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.304649353027344, -46.701942443847656, -45.099239349365234, -43.49653244018555, -41.89382553100586, -40.29112243652344, -38.68841552734375, -37.08570861816406, -35.483001708984375, -33.88029479980469, -32.277591705322266, -30.674884796142578, -29.07217788696289, -27.469472885131836, -25.86676788330078, -24.264060974121094, -22.661357879638672, -21.058652877807617, -19.45594596862793, -17.853240966796875, -16.250534057617188, -14.647829055786133, -13.045124053955078, -11.442418098449707, -9.839712142944336, -8.237006187438965, -6.634300708770752, -5.031595230102539, -3.428889274597168, -1.8261833190917969, -0.2234783172607422, 1.379227638244629, 2.98193359375, 4.584639549255371, 6.187345027923584, 7.790050506591797, 9.392756462097168, 10.995462417602539, 12.598167419433594, 14.200873374938965, 15.803579330444336, 17.40628433227539, 19.008991241455078, 20.611696243286133, 22.214401245117188, 23.817108154296875, 25.41981315612793, 27.022518157958984, 28.625225067138672, 30.227930068969727, 31.830636978149414, 33.43334197998047, 35.036048889160156, 36.638755798339844, 38.241458892822266, 39.84416580200195, 41.446868896484375, 43.04957580566406, 44.652278900146484, 46.25498580932617, 47.85769271850586, 49.46039581298828, 51.06310272216797, 52.665809631347656, 54.268516540527344]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 7.0, 7.0, 7.0, 20.0, 18.0, 26.0, 22.0, 33.0, 79.0, 101.0, 140.0, 238.0, 372.0, 702.0, 1388.0, 3089.0, 8263.0, 31888.0, 3951734.0, 166322.0, 19150.0, 5782.0, 2449.0, 1091.0, 588.0, 317.0, 175.0, 91.0, 57.0, 39.0, 31.0, 14.0, 14.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.86785888671875, -7.6419677734375, -7.41607666015625, -7.190185546875, -6.96429443359375, -6.7384033203125, -6.51251220703125, -6.28662109375, -6.06072998046875, -5.8348388671875, -5.60894775390625, -5.383056640625, -5.15716552734375, -4.9312744140625, -4.70538330078125, -4.4794921875, -4.25360107421875, -4.0277099609375, -3.80181884765625, -3.575927734375, -3.35003662109375, -3.1241455078125, -2.89825439453125, -2.67236328125, -2.44647216796875, -2.2205810546875, -1.99468994140625, -1.768798828125, -1.54290771484375, -1.3170166015625, -1.09112548828125, -0.865234375, -0.63934326171875, -0.4134521484375, -0.18756103515625, 0.038330078125, 0.26422119140625, 0.4901123046875, 0.71600341796875, 0.94189453125, 1.16778564453125, 1.3936767578125, 1.61956787109375, 1.845458984375, 2.07135009765625, 2.2972412109375, 2.52313232421875, 2.7490234375, 2.97491455078125, 3.2008056640625, 3.42669677734375, 3.652587890625, 3.87847900390625, 4.1043701171875, 4.33026123046875, 4.55615234375, 4.78204345703125, 5.0079345703125, 5.23382568359375, 5.459716796875, 5.68560791015625, 5.9114990234375, 6.13739013671875, 6.36328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 7.0, 6.0, 8.0, 17.0, 24.0, 24.0, 31.0, 41.0, 45.0, 63.0, 58.0, 67.0, 80.0, 67.0, 54.0, 53.0, 61.0, 63.0, 38.0, 35.0, 37.0, 21.0, 17.0, 15.0, 12.0, 14.0, 6.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.654296875, -2.57440185546875, -2.4945068359375, -2.41461181640625, -2.334716796875, -2.25482177734375, -2.1749267578125, -2.09503173828125, -2.01513671875, -1.93524169921875, -1.8553466796875, -1.77545166015625, -1.695556640625, -1.61566162109375, -1.5357666015625, -1.45587158203125, -1.3759765625, -1.29608154296875, -1.2161865234375, -1.13629150390625, -1.056396484375, -0.97650146484375, -0.8966064453125, -0.81671142578125, -0.73681640625, -0.65692138671875, -0.5770263671875, -0.49713134765625, -0.417236328125, -0.33734130859375, -0.2574462890625, -0.17755126953125, -0.09765625, -0.01776123046875, 0.0621337890625, 0.14202880859375, 0.221923828125, 0.30181884765625, 0.3817138671875, 0.46160888671875, 0.54150390625, 0.62139892578125, 0.7012939453125, 0.78118896484375, 0.861083984375, 0.94097900390625, 1.0208740234375, 1.10076904296875, 1.1806640625, 1.26055908203125, 1.3404541015625, 1.42034912109375, 1.500244140625, 1.58013916015625, 1.6600341796875, 1.73992919921875, 1.81982421875, 1.89971923828125, 1.9796142578125, 2.05950927734375, 2.139404296875, 2.21929931640625, 2.2991943359375, 2.37908935546875, 2.458984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 8.0, 14.0, 12.0, 15.0, 28.0, 49.0, 40.0, 72.0, 94.0, 109.0, 163.0, 222.0, 292.0, 419.0, 592.0, 959.0, 1579.0, 2812.0, 5242.0, 11080.0, 27956.0, 115780.0, 3822055.0, 146919.0, 32301.0, 11869.0, 5735.0, 2949.0, 1696.0, 978.0, 621.0, 435.0, 311.0, 213.0, 154.0, 113.0, 101.0, 61.0, 54.0, 49.0, 34.0, 23.0, 12.0, 16.0, 12.0, 12.0, 9.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.73272705078125, -4.5670166015625, -4.40130615234375, -4.235595703125, -4.06988525390625, -3.9041748046875, -3.73846435546875, -3.57275390625, -3.40704345703125, -3.2413330078125, -3.07562255859375, -2.909912109375, -2.74420166015625, -2.5784912109375, -2.41278076171875, -2.2470703125, -2.08135986328125, -1.9156494140625, -1.74993896484375, -1.584228515625, -1.41851806640625, -1.2528076171875, -1.08709716796875, -0.92138671875, -0.75567626953125, -0.5899658203125, -0.42425537109375, -0.258544921875, -0.09283447265625, 0.0728759765625, 0.23858642578125, 0.404296875, 0.57000732421875, 0.7357177734375, 0.90142822265625, 1.067138671875, 1.23284912109375, 1.3985595703125, 1.56427001953125, 1.72998046875, 1.89569091796875, 2.0614013671875, 2.22711181640625, 2.392822265625, 2.55853271484375, 2.7242431640625, 2.88995361328125, 3.0556640625, 3.22137451171875, 3.3870849609375, 3.55279541015625, 3.718505859375, 3.88421630859375, 4.0499267578125, 4.21563720703125, 4.38134765625, 4.54705810546875, 4.7127685546875, 4.87847900390625, 5.044189453125, 5.20989990234375, 5.3756103515625, 5.54132080078125, 5.70703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 11.0, 20.0, 22.0, 43.0, 95.0, 332.0, 3253.0, 146.0, 61.0, 32.0, 20.0, 8.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.067718505859375, -2.98309326171875, -2.898468017578125, -2.8138427734375, -2.729217529296875, -2.64459228515625, -2.559967041015625, -2.475341796875, -2.390716552734375, -2.30609130859375, -2.221466064453125, -2.1368408203125, -2.052215576171875, -1.96759033203125, -1.882965087890625, -1.79833984375, -1.713714599609375, -1.62908935546875, -1.544464111328125, -1.4598388671875, -1.375213623046875, -1.29058837890625, -1.205963134765625, -1.121337890625, -1.036712646484375, -0.95208740234375, -0.867462158203125, -0.7828369140625, -0.698211669921875, -0.61358642578125, -0.528961181640625, -0.4443359375, -0.359710693359375, -0.27508544921875, -0.190460205078125, -0.1058349609375, -0.021209716796875, 0.06341552734375, 0.148040771484375, 0.232666015625, 0.317291259765625, 0.40191650390625, 0.486541748046875, 0.5711669921875, 0.655792236328125, 0.74041748046875, 0.825042724609375, 0.90966796875, 0.994293212890625, 1.07891845703125, 1.163543701171875, 1.2481689453125, 1.332794189453125, 1.41741943359375, 1.502044677734375, 1.586669921875, 1.671295166015625, 1.75592041015625, 1.840545654296875, 1.9251708984375, 2.009796142578125, 2.09442138671875, 2.179046630859375, 2.263671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 17.0, 22.0, 48.0, 96.0, 130.0, 187.0, 162.0, 144.0, 98.0, 48.0, 31.0, 12.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-18.860492706298828, -18.50800895690918, -18.15552520751953, -17.803041458129883, -17.450557708740234, -17.098072052001953, -16.745588302612305, -16.393104553222656, -16.040620803833008, -15.68813705444336, -15.335653305053711, -14.983168601989746, -14.630684852600098, -14.27820110321045, -13.9257173538208, -13.573232650756836, -13.220748901367188, -12.868265151977539, -12.51578140258789, -12.163296699523926, -11.810812950134277, -11.458329200744629, -11.10584545135498, -10.753360748291016, -10.400877952575684, -10.048394203186035, -9.695910453796387, -9.343425750732422, -8.990942001342773, -8.638458251953125, -8.285974502563477, -7.93349027633667, -7.581006050109863, -7.228522300720215, -6.876038074493408, -6.52355432510376, -6.171070098876953, -5.818586349487305, -5.466102600097656, -5.11361837387085, -4.761134147644043, -4.4086503982543945, -4.056166172027588, -3.7036824226379395, -3.351198196411133, -2.9987144470214844, -2.646230459213257, -2.2937464714050293, -1.9412624835968018, -1.5887784957885742, -1.2362945079803467, -0.8838106393814087, -0.5313266515731812, -0.1788426637649536, 0.17364120483398438, 0.5261251926422119, 0.8786091804504395, 1.231093168258667, 1.5835771560668945, 1.9360610246658325, 2.2885451316833496, 2.641028881072998, 2.9935128688812256, 3.345996856689453, 3.6984808444976807]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 10.0, 4.0, 4.0, 12.0, 12.0, 16.0, 19.0, 22.0, 31.0, 27.0, 24.0, 34.0, 25.0, 18.0, 41.0, 46.0, 51.0, 46.0, 53.0, 54.0, 37.0, 38.0, 48.0, 32.0, 41.0, 38.0, 30.0, 36.0, 22.0, 23.0, 25.0, 18.0, 10.0, 13.0, 12.0, 8.0, 2.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.86547327041626, -4.707979679107666, -4.550486087799072, -4.3929924964904785, -4.235498905181885, -4.078005313873291, -3.920511484146118, -3.7630178928375244, -3.6055243015289307, -3.448030710220337, -3.290537118911743, -3.1330435276031494, -2.9755496978759766, -2.818056106567383, -2.660562515258789, -2.5030689239501953, -2.3455753326416016, -2.188081741333008, -2.030588150024414, -1.8730944395065308, -1.715600848197937, -1.5581072568893433, -1.40061354637146, -1.2431199550628662, -1.0856263637542725, -0.9281327724456787, -0.7706391215324402, -0.6131454706192017, -0.4556518793106079, -0.29815828800201416, -0.14066463708877563, 0.01682901382446289, 0.17432212829589844, 0.3318157494068146, 0.4893093705177307, 0.6468030214309692, 0.804296612739563, 0.9617902040481567, 1.11928391456604, 1.2767775058746338, 1.4342710971832275, 1.5917646884918213, 1.749258279800415, 1.9067519903182983, 2.0642457008361816, 2.2217392921447754, 2.379232883453369, 2.536726474761963, 2.6942200660705566, 2.8517136573791504, 3.009207248687744, 3.166700839996338, 3.3241944313049316, 3.4816880226135254, 3.6391818523406982, 3.796675443649292, 3.9541690349578857, 4.111662864685059, 4.269156455993652, 4.426650047302246, 4.58414363861084, 4.741637229919434, 4.899130821228027, 5.056624412536621, 5.214118003845215]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 13.0, 27.0, 33.0, 68.0, 89.0, 203.0, 322.0, 684.0, 1502.0, 3894.0, 11464.0, 37997.0, 146228.0, 437250.0, 297743.0, 77868.0, 21289.0, 7180.0, 2532.0, 1063.0, 473.0, 247.0, 148.0, 77.0, 46.0, 25.0, 26.0, 17.0, 11.0, 7.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1015625, -3.9483642578125, -3.795166015625, -3.6419677734375, -3.48876953125, -3.3355712890625, -3.182373046875, -3.0291748046875, -2.8759765625, -2.7227783203125, -2.569580078125, -2.4163818359375, -2.26318359375, -2.1099853515625, -1.956787109375, -1.8035888671875, -1.650390625, -1.4971923828125, -1.343994140625, -1.1907958984375, -1.03759765625, -0.8843994140625, -0.731201171875, -0.5780029296875, -0.4248046875, -0.2716064453125, -0.118408203125, 0.0347900390625, 0.18798828125, 0.3411865234375, 0.494384765625, 0.6475830078125, 0.80078125, 0.9539794921875, 1.107177734375, 1.2603759765625, 1.41357421875, 1.5667724609375, 1.719970703125, 1.8731689453125, 2.0263671875, 2.1795654296875, 2.332763671875, 2.4859619140625, 2.63916015625, 2.7923583984375, 2.945556640625, 3.0987548828125, 3.251953125, 3.4051513671875, 3.558349609375, 3.7115478515625, 3.86474609375, 4.0179443359375, 4.171142578125, 4.3243408203125, 4.4775390625, 4.6307373046875, 4.783935546875, 4.9371337890625, 5.09033203125, 5.2435302734375, 5.396728515625, 5.5499267578125, 5.703125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 12.0, 4.0, 7.0, 12.0, 11.0, 28.0, 25.0, 33.0, 50.0, 39.0, 58.0, 63.0, 78.0, 74.0, 78.0, 60.0, 68.0, 53.0, 44.0, 48.0, 30.0, 28.0, 26.0, 16.0, 14.0, 12.0, 5.0, 5.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.91522216796875, -2.8265380859375, -2.73785400390625, -2.649169921875, -2.56048583984375, -2.4718017578125, -2.38311767578125, -2.29443359375, -2.20574951171875, -2.1170654296875, -2.02838134765625, -1.939697265625, -1.85101318359375, -1.7623291015625, -1.67364501953125, -1.5849609375, -1.49627685546875, -1.4075927734375, -1.31890869140625, -1.230224609375, -1.14154052734375, -1.0528564453125, -0.96417236328125, -0.87548828125, -0.78680419921875, -0.6981201171875, -0.60943603515625, -0.520751953125, -0.43206787109375, -0.3433837890625, -0.25469970703125, -0.166015625, -0.07733154296875, 0.0113525390625, 0.10003662109375, 0.188720703125, 0.27740478515625, 0.3660888671875, 0.45477294921875, 0.54345703125, 0.63214111328125, 0.7208251953125, 0.80950927734375, 0.898193359375, 0.98687744140625, 1.0755615234375, 1.16424560546875, 1.2529296875, 1.34161376953125, 1.4302978515625, 1.51898193359375, 1.607666015625, 1.69635009765625, 1.7850341796875, 1.87371826171875, 1.96240234375, 2.05108642578125, 2.1397705078125, 2.22845458984375, 2.317138671875, 2.40582275390625, 2.4945068359375, 2.58319091796875, 2.671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 8.0, 11.0, 14.0, 26.0, 46.0, 54.0, 104.0, 151.0, 486.0, 1495.0, 7990.0, 101113.0, 850146.0, 77757.0, 6899.0, 1396.0, 398.0, 178.0, 92.0, 54.0, 35.0, 23.0, 13.0, 12.0, 7.0, 10.0, 8.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.625, -15.2078857421875, -14.790771484375, -14.3736572265625, -13.95654296875, -13.5394287109375, -13.122314453125, -12.7052001953125, -12.2880859375, -11.8709716796875, -11.453857421875, -11.0367431640625, -10.61962890625, -10.2025146484375, -9.785400390625, -9.3682861328125, -8.951171875, -8.5340576171875, -8.116943359375, -7.6998291015625, -7.28271484375, -6.8656005859375, -6.448486328125, -6.0313720703125, -5.6142578125, -5.1971435546875, -4.780029296875, -4.3629150390625, -3.94580078125, -3.5286865234375, -3.111572265625, -2.6944580078125, -2.27734375, -1.8602294921875, -1.443115234375, -1.0260009765625, -0.60888671875, -0.1917724609375, 0.225341796875, 0.6424560546875, 1.0595703125, 1.4766845703125, 1.893798828125, 2.3109130859375, 2.72802734375, 3.1451416015625, 3.562255859375, 3.9793701171875, 4.396484375, 4.8135986328125, 5.230712890625, 5.6478271484375, 6.06494140625, 6.4820556640625, 6.899169921875, 7.3162841796875, 7.7333984375, 8.1505126953125, 8.567626953125, 8.9847412109375, 9.40185546875, 9.8189697265625, 10.236083984375, 10.6531982421875, 11.0703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 2.0, 12.0, 3.0, 12.0, 8.0, 11.0, 14.0, 11.0, 18.0, 29.0, 36.0, 39.0, 41.0, 57.0, 53.0, 53.0, 60.0, 60.0, 57.0, 47.0, 60.0, 41.0, 70.0, 43.0, 28.0, 19.0, 22.0, 24.0, 10.0, 12.0, 11.0, 7.0, 5.0, 3.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4375, -13.0316162109375, -12.625732421875, -12.2198486328125, -11.81396484375, -11.4080810546875, -11.002197265625, -10.5963134765625, -10.1904296875, -9.7845458984375, -9.378662109375, -8.9727783203125, -8.56689453125, -8.1610107421875, -7.755126953125, -7.3492431640625, -6.943359375, -6.5374755859375, -6.131591796875, -5.7257080078125, -5.31982421875, -4.9139404296875, -4.508056640625, -4.1021728515625, -3.6962890625, -3.2904052734375, -2.884521484375, -2.4786376953125, -2.07275390625, -1.6668701171875, -1.260986328125, -0.8551025390625, -0.44921875, -0.0433349609375, 0.362548828125, 0.7684326171875, 1.17431640625, 1.5802001953125, 1.986083984375, 2.3919677734375, 2.7978515625, 3.2037353515625, 3.609619140625, 4.0155029296875, 4.42138671875, 4.8272705078125, 5.233154296875, 5.6390380859375, 6.044921875, 6.4508056640625, 6.856689453125, 7.2625732421875, 7.66845703125, 8.0743408203125, 8.480224609375, 8.8861083984375, 9.2919921875, 9.6978759765625, 10.103759765625, 10.5096435546875, 10.91552734375, 11.3214111328125, 11.727294921875, 12.1331787109375, 12.5390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 26.0, 74.0, 175.0, 827.0, 12834.0, 1020562.0, 12995.0, 768.0, 173.0, 58.0, 18.0, 21.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0625, -18.5673828125, -18.072265625, -17.5771484375, -17.08203125, -16.5869140625, -16.091796875, -15.5966796875, -15.1015625, -14.6064453125, -14.111328125, -13.6162109375, -13.12109375, -12.6259765625, -12.130859375, -11.6357421875, -11.140625, -10.6455078125, -10.150390625, -9.6552734375, -9.16015625, -8.6650390625, -8.169921875, -7.6748046875, -7.1796875, -6.6845703125, -6.189453125, -5.6943359375, -5.19921875, -4.7041015625, -4.208984375, -3.7138671875, -3.21875, -2.7236328125, -2.228515625, -1.7333984375, -1.23828125, -0.7431640625, -0.248046875, 0.2470703125, 0.7421875, 1.2373046875, 1.732421875, 2.2275390625, 2.72265625, 3.2177734375, 3.712890625, 4.2080078125, 4.703125, 5.1982421875, 5.693359375, 6.1884765625, 6.68359375, 7.1787109375, 7.673828125, 8.1689453125, 8.6640625, 9.1591796875, 9.654296875, 10.1494140625, 10.64453125, 11.1396484375, 11.634765625, 12.1298828125, 12.625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 14.0, 32.0, 56.0, 73.0, 130.0, 179.0, 166.0, 136.0, 76.0, 56.0, 18.0, 12.0, 17.0, 9.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007848739624023438, -0.0007567405700683594, -0.000728607177734375, -0.0007004737854003906, -0.0006723403930664062, -0.0006442070007324219, -0.0006160736083984375, -0.0005879402160644531, -0.0005598068237304688, -0.0005316734313964844, -0.0005035400390625, -0.0004754066467285156, -0.00044727325439453125, -0.0004191398620605469, -0.0003910064697265625, -0.0003628730773925781, -0.00033473968505859375, -0.0003066062927246094, -0.000278472900390625, -0.0002503395080566406, -0.00022220611572265625, -0.00019407272338867188, -0.0001659393310546875, -0.00013780593872070312, -0.00010967254638671875, -8.153915405273438e-05, -5.340576171875e-05, -2.5272369384765625e-05, 2.86102294921875e-06, 3.0994415283203125e-05, 5.91278076171875e-05, 8.726119995117188e-05, 0.00011539459228515625, 0.00014352798461914062, 0.000171661376953125, 0.00019979476928710938, 0.00022792816162109375, 0.0002560615539550781, 0.0002841949462890625, 0.0003123283386230469, 0.00034046173095703125, 0.0003685951232910156, 0.000396728515625, 0.0004248619079589844, 0.00045299530029296875, 0.0004811286926269531, 0.0005092620849609375, 0.0005373954772949219, 0.0005655288696289062, 0.0005936622619628906, 0.000621795654296875, 0.0006499290466308594, 0.0006780624389648438, 0.0007061958312988281, 0.0007343292236328125, 0.0007624626159667969, 0.0007905960083007812, 0.0008187294006347656, 0.00084686279296875, 0.0008749961853027344, 0.0009031295776367188, 0.0009312629699707031, 0.0009593963623046875, 0.0009875297546386719, 0.0010156631469726562]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 8.0, 16.0, 23.0, 71.0, 238.0, 2588.0, 993560.0, 50999.0, 829.0, 132.0, 54.0, 22.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.063720703125, -16.47119140625, -15.878662109375, -15.2861328125, -14.693603515625, -14.10107421875, -13.508544921875, -12.916015625, -12.323486328125, -11.73095703125, -11.138427734375, -10.5458984375, -9.953369140625, -9.36083984375, -8.768310546875, -8.17578125, -7.583251953125, -6.99072265625, -6.398193359375, -5.8056640625, -5.213134765625, -4.62060546875, -4.028076171875, -3.435546875, -2.843017578125, -2.25048828125, -1.657958984375, -1.0654296875, -0.472900390625, 0.11962890625, 0.712158203125, 1.3046875, 1.897216796875, 2.48974609375, 3.082275390625, 3.6748046875, 4.267333984375, 4.85986328125, 5.452392578125, 6.044921875, 6.637451171875, 7.22998046875, 7.822509765625, 8.4150390625, 9.007568359375, 9.60009765625, 10.192626953125, 10.78515625, 11.377685546875, 11.97021484375, 12.562744140625, 13.1552734375, 13.747802734375, 14.34033203125, 14.932861328125, 15.525390625, 16.117919921875, 16.71044921875, 17.302978515625, 17.8955078125, 18.488037109375, 19.08056640625, 19.673095703125, 20.265625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 32.0, 91.0, 226.0, 323.0, 196.0, 74.0, 15.0, 10.0, 10.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.748046875, -3.420440673828125, -3.09283447265625, -2.765228271484375, -2.4376220703125, -2.110015869140625, -1.78240966796875, -1.454803466796875, -1.127197265625, -0.799591064453125, -0.47198486328125, -0.144378662109375, 0.1832275390625, 0.510833740234375, 0.83843994140625, 1.166046142578125, 1.49365234375, 1.821258544921875, 2.14886474609375, 2.476470947265625, 2.8040771484375, 3.131683349609375, 3.45928955078125, 3.786895751953125, 4.114501953125, 4.442108154296875, 4.76971435546875, 5.097320556640625, 5.4249267578125, 5.752532958984375, 6.08013916015625, 6.407745361328125, 6.7353515625, 7.062957763671875, 7.39056396484375, 7.718170166015625, 8.0457763671875, 8.373382568359375, 8.70098876953125, 9.028594970703125, 9.356201171875, 9.683807373046875, 10.01141357421875, 10.339019775390625, 10.6666259765625, 10.994232177734375, 11.32183837890625, 11.649444580078125, 11.97705078125, 12.304656982421875, 12.63226318359375, 12.959869384765625, 13.2874755859375, 13.615081787109375, 13.94268798828125, 14.270294189453125, 14.597900390625, 14.925506591796875, 15.25311279296875, 15.580718994140625, 15.9083251953125, 16.235931396484375, 16.56353759765625, 16.891143798828125, 17.21875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 17.0, 73.0, 163.0, 308.0, 257.0, 105.0, 38.0, 19.0, 10.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-156.6019744873047, -152.19078063964844, -147.77960205078125, -143.368408203125, -138.95721435546875, -134.5460205078125, -130.13482666015625, -125.72364807128906, -121.31245422363281, -116.90126037597656, -112.49007415771484, -108.07888793945312, -103.66769409179688, -99.25650024414062, -94.8453140258789, -90.43412780761719, -86.02293395996094, -81.61174011230469, -77.20055389404297, -72.78936767578125, -68.378173828125, -63.966983795166016, -59.55579376220703, -55.14460372924805, -50.73341369628906, -46.32222366333008, -41.911033630371094, -37.49984359741211, -33.088653564453125, -28.67746353149414, -24.266273498535156, -19.855083465576172, -15.44390869140625, -11.032718658447266, -6.621528625488281, -2.210338592529297, 2.2008514404296875, 6.612041473388672, 11.023231506347656, 15.43442153930664, 19.845611572265625, 24.25680160522461, 28.667991638183594, 33.07918167114258, 37.49037170410156, 41.90156173706055, 46.31275177001953, 50.723941802978516, 55.1351318359375, 59.546321868896484, 63.95751190185547, 68.36869812011719, 72.77989196777344, 77.19108581542969, 81.6022720336914, 86.01345825195312, 90.42465209960938, 94.83584594726562, 99.24703216552734, 103.65821838378906, 108.06941223144531, 112.48060607910156, 116.89179229736328, 121.302978515625, 125.71417236328125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 13.0, 9.0, 16.0, 20.0, 19.0, 18.0, 24.0, 48.0, 36.0, 49.0, 48.0, 44.0, 71.0, 43.0, 68.0, 70.0, 39.0, 53.0, 44.0, 44.0, 51.0, 29.0, 34.0, 19.0, 17.0, 15.0, 6.0, 14.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.44290542602539, -57.641380310058594, -55.83985137939453, -54.038326263427734, -52.23680114746094, -50.43527603149414, -48.633750915527344, -46.83222198486328, -45.030696868896484, -43.22917175292969, -41.427642822265625, -39.62611770629883, -37.82459259033203, -36.023067474365234, -34.22154235839844, -32.420013427734375, -30.618488311767578, -28.81696319580078, -27.01543617248535, -25.213909149169922, -23.412384033203125, -21.610858917236328, -19.8093318939209, -18.00780487060547, -16.206279754638672, -14.404753684997559, -12.603227615356445, -10.801701545715332, -9.000175476074219, -7.1986494064331055, -5.397123336791992, -3.595597267150879, -1.7940673828125, 0.007458686828613281, 1.8089847564697266, 3.61051082611084, 5.412036895751953, 7.213562965393066, 9.01508903503418, 10.816615104675293, 12.618141174316406, 14.41966724395752, 16.221193313598633, 18.022720336914062, 19.82424545288086, 21.625770568847656, 23.427297592163086, 25.228824615478516, 27.030349731445312, 28.83187484741211, 30.63340187072754, 32.43492889404297, 34.236454010009766, 36.03797912597656, 37.839508056640625, 39.64103317260742, 41.44255828857422, 43.244083404541016, 45.04560852050781, 46.847137451171875, 48.64866256713867, 50.45018768310547, 52.25171661376953, 54.05324172973633, 55.854766845703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 14.0, 19.0, 24.0, 29.0, 44.0, 101.0, 155.0, 246.0, 542.0, 1171.0, 3373.0, 16257.0, 4103154.0, 58975.0, 6726.0, 1895.0, 800.0, 338.0, 159.0, 88.0, 45.0, 31.0, 25.0, 17.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-13.703125, -13.38250732421875, -13.0618896484375, -12.74127197265625, -12.420654296875, -12.10003662109375, -11.7794189453125, -11.45880126953125, -11.13818359375, -10.81756591796875, -10.4969482421875, -10.17633056640625, -9.855712890625, -9.53509521484375, -9.2144775390625, -8.89385986328125, -8.5732421875, -8.25262451171875, -7.9320068359375, -7.61138916015625, -7.290771484375, -6.97015380859375, -6.6495361328125, -6.32891845703125, -6.00830078125, -5.68768310546875, -5.3670654296875, -5.04644775390625, -4.725830078125, -4.40521240234375, -4.0845947265625, -3.76397705078125, -3.443359375, -3.12274169921875, -2.8021240234375, -2.48150634765625, -2.160888671875, -1.84027099609375, -1.5196533203125, -1.19903564453125, -0.87841796875, -0.55780029296875, -0.2371826171875, 0.08343505859375, 0.404052734375, 0.72467041015625, 1.0452880859375, 1.36590576171875, 1.6865234375, 2.00714111328125, 2.3277587890625, 2.64837646484375, 2.968994140625, 3.28961181640625, 3.6102294921875, 3.93084716796875, 4.25146484375, 4.57208251953125, 4.8927001953125, 5.21331787109375, 5.533935546875, 5.85455322265625, 6.1751708984375, 6.49578857421875, 6.81640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 11.0, 6.0, 15.0, 27.0, 33.0, 44.0, 53.0, 48.0, 82.0, 53.0, 67.0, 97.0, 78.0, 65.0, 65.0, 57.0, 36.0, 30.0, 24.0, 20.0, 17.0, 12.0, 7.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.22265625, -4.11444091796875, -4.0062255859375, -3.89801025390625, -3.789794921875, -3.68157958984375, -3.5733642578125, -3.46514892578125, -3.35693359375, -3.24871826171875, -3.1405029296875, -3.03228759765625, -2.924072265625, -2.81585693359375, -2.7076416015625, -2.59942626953125, -2.4912109375, -2.38299560546875, -2.2747802734375, -2.16656494140625, -2.058349609375, -1.95013427734375, -1.8419189453125, -1.73370361328125, -1.62548828125, -1.51727294921875, -1.4090576171875, -1.30084228515625, -1.192626953125, -1.08441162109375, -0.9761962890625, -0.86798095703125, -0.759765625, -0.65155029296875, -0.5433349609375, -0.43511962890625, -0.326904296875, -0.21868896484375, -0.1104736328125, -0.00225830078125, 0.10595703125, 0.21417236328125, 0.3223876953125, 0.43060302734375, 0.538818359375, 0.64703369140625, 0.7552490234375, 0.86346435546875, 0.9716796875, 1.07989501953125, 1.1881103515625, 1.29632568359375, 1.404541015625, 1.51275634765625, 1.6209716796875, 1.72918701171875, 1.83740234375, 1.94561767578125, 2.0538330078125, 2.16204833984375, 2.270263671875, 2.37847900390625, 2.4866943359375, 2.59490966796875, 2.703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 13.0, 5.0, 12.0, 20.0, 34.0, 41.0, 65.0, 96.0, 119.0, 216.0, 305.0, 403.0, 622.0, 985.0, 1707.0, 3193.0, 6406.0, 17721.0, 141559.0, 3977910.0, 25532.0, 8244.0, 3825.0, 1916.0, 1148.0, 722.0, 451.0, 306.0, 200.0, 140.0, 115.0, 78.0, 55.0, 34.0, 23.0, 16.0, 7.0, 9.0, 12.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2265625, -8.909912109375, -8.59326171875, -8.276611328125, -7.9599609375, -7.643310546875, -7.32666015625, -7.010009765625, -6.693359375, -6.376708984375, -6.06005859375, -5.743408203125, -5.4267578125, -5.110107421875, -4.79345703125, -4.476806640625, -4.16015625, -3.843505859375, -3.52685546875, -3.210205078125, -2.8935546875, -2.576904296875, -2.26025390625, -1.943603515625, -1.626953125, -1.310302734375, -0.99365234375, -0.677001953125, -0.3603515625, -0.043701171875, 0.27294921875, 0.589599609375, 0.90625, 1.222900390625, 1.53955078125, 1.856201171875, 2.1728515625, 2.489501953125, 2.80615234375, 3.122802734375, 3.439453125, 3.756103515625, 4.07275390625, 4.389404296875, 4.7060546875, 5.022705078125, 5.33935546875, 5.656005859375, 5.97265625, 6.289306640625, 6.60595703125, 6.922607421875, 7.2392578125, 7.555908203125, 7.87255859375, 8.189208984375, 8.505859375, 8.822509765625, 9.13916015625, 9.455810546875, 9.7724609375, 10.089111328125, 10.40576171875, 10.722412109375, 11.0390625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 12.0, 12.0, 39.0, 69.0, 3617.0, 204.0, 48.0, 22.0, 4.0, 10.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.55352783203125, -2.4508056640625, -2.34808349609375, -2.245361328125, -2.14263916015625, -2.0399169921875, -1.93719482421875, -1.83447265625, -1.73175048828125, -1.6290283203125, -1.52630615234375, -1.423583984375, -1.32086181640625, -1.2181396484375, -1.11541748046875, -1.0126953125, -0.90997314453125, -0.8072509765625, -0.70452880859375, -0.601806640625, -0.49908447265625, -0.3963623046875, -0.29364013671875, -0.19091796875, -0.08819580078125, 0.0145263671875, 0.11724853515625, 0.219970703125, 0.32269287109375, 0.4254150390625, 0.52813720703125, 0.630859375, 0.73358154296875, 0.8363037109375, 0.93902587890625, 1.041748046875, 1.14447021484375, 1.2471923828125, 1.34991455078125, 1.45263671875, 1.55535888671875, 1.6580810546875, 1.76080322265625, 1.863525390625, 1.96624755859375, 2.0689697265625, 2.17169189453125, 2.2744140625, 2.37713623046875, 2.4798583984375, 2.58258056640625, 2.685302734375, 2.78802490234375, 2.8907470703125, 2.99346923828125, 3.09619140625, 3.19891357421875, 3.3016357421875, 3.40435791015625, 3.507080078125, 3.60980224609375, 3.7125244140625, 3.81524658203125, 3.91796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 15.0, 19.0, 38.0, 42.0, 67.0, 78.0, 98.0, 123.0, 108.0, 115.0, 86.0, 59.0, 43.0, 34.0, 21.0, 6.0, 12.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.610106468200684, -8.326332092285156, -8.042557716369629, -7.758783340454102, -7.475008964538574, -7.191234588623047, -6.9074602127075195, -6.623685836791992, -6.339911460876465, -6.0561370849609375, -5.77236270904541, -5.488588333129883, -5.2048139572143555, -4.921039581298828, -4.637265205383301, -4.353490829467773, -4.069716453552246, -3.7859420776367188, -3.5021677017211914, -3.218393325805664, -2.9346189498901367, -2.6508445739746094, -2.367070198059082, -2.0832958221435547, -1.7995214462280273, -1.5157470703125, -1.2319726943969727, -0.9481983184814453, -0.664423942565918, -0.3806495666503906, -0.09687519073486328, 0.18689918518066406, 0.4706745147705078, 0.7544488906860352, 1.0382232666015625, 1.3219976425170898, 1.6057720184326172, 1.8895463943481445, 2.173320770263672, 2.457095146179199, 2.7408695220947266, 3.024643898010254, 3.3084182739257812, 3.5921926498413086, 3.875967025756836, 4.159741401672363, 4.443515777587891, 4.727290153503418, 5.011064529418945, 5.294838905334473, 5.57861328125, 5.862387657165527, 6.146162033081055, 6.429936408996582, 6.713710784912109, 6.997485160827637, 7.281259536743164, 7.565033912658691, 7.848808288574219, 8.132582664489746, 8.416357040405273, 8.7001314163208, 8.983905792236328, 9.267680168151855, 9.551454544067383]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 9.0, 10.0, 10.0, 19.0, 17.0, 20.0, 25.0, 28.0, 30.0, 33.0, 46.0, 56.0, 39.0, 54.0, 54.0, 50.0, 58.0, 55.0, 61.0, 44.0, 42.0, 33.0, 41.0, 26.0, 24.0, 19.0, 22.0, 13.0, 15.0, 8.0, 10.0, 4.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.873305320739746, -5.667628765106201, -5.461951732635498, -5.256275177001953, -5.05059814453125, -4.844921588897705, -4.63924503326416, -4.433568000793457, -4.227890968322754, -4.022214412689209, -3.816537380218506, -3.610860824584961, -3.405183792114258, -3.199507236480713, -2.993830442428589, -2.788153648376465, -2.58247709274292, -2.376800298690796, -2.171123504638672, -1.9654468297958374, -1.7597700357437134, -1.5540932416915894, -1.3484165668487549, -1.1427397727966309, -0.9370629787445068, -0.7313861846923828, -0.5257094502449036, -0.3200327157974243, -0.11435592174530029, 0.09132087230682373, 0.2969975471496582, 0.5026743412017822, 0.7083511352539062, 0.9140279293060303, 1.1197047233581543, 1.3253813982009888, 1.5310581922531128, 1.7367349863052368, 1.9424116611480713, 2.1480884552001953, 2.3537652492523193, 2.5594420433044434, 2.7651188373565674, 2.9707956314086914, 3.1764721870422363, 3.3821492195129395, 3.5878257751464844, 3.7935025691986084, 3.9991793632507324, 4.204855918884277, 4.4105329513549805, 4.616209506988525, 4.8218865394592285, 5.027563095092773, 5.233240127563477, 5.4389166831970215, 5.644593238830566, 5.850269794464111, 6.0559468269348145, 6.261623382568359, 6.4673004150390625, 6.672976970672607, 6.878653526306152, 7.0843305587768555, 7.290007591247559]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 9.0, 20.0, 18.0, 43.0, 53.0, 79.0, 113.0, 149.0, 232.0, 382.0, 626.0, 968.0, 1818.0, 3249.0, 6495.0, 13583.0, 31615.0, 82264.0, 218596.0, 370335.0, 192532.0, 71682.0, 28390.0, 12307.0, 5738.0, 3049.0, 1646.0, 933.0, 557.0, 384.0, 241.0, 142.0, 96.0, 60.0, 34.0, 28.0, 26.0, 15.0, 9.0, 11.0, 3.0, 2.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.6484375, -4.50054931640625, -4.3526611328125, -4.20477294921875, -4.056884765625, -3.90899658203125, -3.7611083984375, -3.61322021484375, -3.46533203125, -3.31744384765625, -3.1695556640625, -3.02166748046875, -2.873779296875, -2.72589111328125, -2.5780029296875, -2.43011474609375, -2.2822265625, -2.13433837890625, -1.9864501953125, -1.83856201171875, -1.690673828125, -1.54278564453125, -1.3948974609375, -1.24700927734375, -1.09912109375, -0.95123291015625, -0.8033447265625, -0.65545654296875, -0.507568359375, -0.35968017578125, -0.2117919921875, -0.06390380859375, 0.083984375, 0.23187255859375, 0.3797607421875, 0.52764892578125, 0.675537109375, 0.82342529296875, 0.9713134765625, 1.11920166015625, 1.26708984375, 1.41497802734375, 1.5628662109375, 1.71075439453125, 1.858642578125, 2.00653076171875, 2.1544189453125, 2.30230712890625, 2.4501953125, 2.59808349609375, 2.7459716796875, 2.89385986328125, 3.041748046875, 3.18963623046875, 3.3375244140625, 3.48541259765625, 3.63330078125, 3.78118896484375, 3.9290771484375, 4.07696533203125, 4.224853515625, 4.37274169921875, 4.5206298828125, 4.66851806640625, 4.81640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 7.0, 8.0, 12.0, 16.0, 16.0, 28.0, 29.0, 36.0, 61.0, 56.0, 71.0, 59.0, 74.0, 80.0, 61.0, 67.0, 67.0, 47.0, 38.0, 28.0, 29.0, 34.0, 16.0, 10.0, 10.0, 4.0, 4.0, 8.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.265625, -4.153839111328125, -4.04205322265625, -3.930267333984375, -3.8184814453125, -3.706695556640625, -3.59490966796875, -3.483123779296875, -3.371337890625, -3.259552001953125, -3.14776611328125, -3.035980224609375, -2.9241943359375, -2.812408447265625, -2.70062255859375, -2.588836669921875, -2.47705078125, -2.365264892578125, -2.25347900390625, -2.141693115234375, -2.0299072265625, -1.918121337890625, -1.80633544921875, -1.694549560546875, -1.582763671875, -1.470977783203125, -1.35919189453125, -1.247406005859375, -1.1356201171875, -1.023834228515625, -0.91204833984375, -0.800262451171875, -0.6884765625, -0.576690673828125, -0.46490478515625, -0.353118896484375, -0.2413330078125, -0.129547119140625, -0.01776123046875, 0.094024658203125, 0.205810546875, 0.317596435546875, 0.42938232421875, 0.541168212890625, 0.6529541015625, 0.764739990234375, 0.87652587890625, 0.988311767578125, 1.10009765625, 1.211883544921875, 1.32366943359375, 1.435455322265625, 1.5472412109375, 1.659027099609375, 1.77081298828125, 1.882598876953125, 1.994384765625, 2.106170654296875, 2.21795654296875, 2.329742431640625, 2.4415283203125, 2.553314208984375, 2.66510009765625, 2.776885986328125, 2.888671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 11.0, 9.0, 25.0, 22.0, 39.0, 76.0, 124.0, 248.0, 540.0, 1156.0, 3600.0, 19061.0, 254297.0, 709075.0, 50176.0, 6827.0, 1860.0, 655.0, 307.0, 167.0, 83.0, 63.0, 37.0, 16.0, 17.0, 12.0, 12.0, 6.0, 8.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.516845703125, -15.08837890625, -14.659912109375, -14.2314453125, -13.802978515625, -13.37451171875, -12.946044921875, -12.517578125, -12.089111328125, -11.66064453125, -11.232177734375, -10.8037109375, -10.375244140625, -9.94677734375, -9.518310546875, -9.08984375, -8.661376953125, -8.23291015625, -7.804443359375, -7.3759765625, -6.947509765625, -6.51904296875, -6.090576171875, -5.662109375, -5.233642578125, -4.80517578125, -4.376708984375, -3.9482421875, -3.519775390625, -3.09130859375, -2.662841796875, -2.234375, -1.805908203125, -1.37744140625, -0.948974609375, -0.5205078125, -0.092041015625, 0.33642578125, 0.764892578125, 1.193359375, 1.621826171875, 2.05029296875, 2.478759765625, 2.9072265625, 3.335693359375, 3.76416015625, 4.192626953125, 4.62109375, 5.049560546875, 5.47802734375, 5.906494140625, 6.3349609375, 6.763427734375, 7.19189453125, 7.620361328125, 8.048828125, 8.477294921875, 8.90576171875, 9.334228515625, 9.7626953125, 10.191162109375, 10.61962890625, 11.048095703125, 11.4765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 7.0, 4.0, 4.0, 8.0, 11.0, 18.0, 8.0, 20.0, 13.0, 20.0, 30.0, 22.0, 38.0, 40.0, 56.0, 56.0, 44.0, 51.0, 66.0, 55.0, 56.0, 58.0, 43.0, 51.0, 41.0, 31.0, 30.0, 20.0, 16.0, 15.0, 15.0, 13.0, 11.0, 12.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4609375, -12.9945068359375, -12.528076171875, -12.0616455078125, -11.59521484375, -11.1287841796875, -10.662353515625, -10.1959228515625, -9.7294921875, -9.2630615234375, -8.796630859375, -8.3302001953125, -7.86376953125, -7.3973388671875, -6.930908203125, -6.4644775390625, -5.998046875, -5.5316162109375, -5.065185546875, -4.5987548828125, -4.13232421875, -3.6658935546875, -3.199462890625, -2.7330322265625, -2.2666015625, -1.8001708984375, -1.333740234375, -0.8673095703125, -0.40087890625, 0.0655517578125, 0.531982421875, 0.9984130859375, 1.46484375, 1.9312744140625, 2.397705078125, 2.8641357421875, 3.33056640625, 3.7969970703125, 4.263427734375, 4.7298583984375, 5.1962890625, 5.6627197265625, 6.129150390625, 6.5955810546875, 7.06201171875, 7.5284423828125, 7.994873046875, 8.4613037109375, 8.927734375, 9.3941650390625, 9.860595703125, 10.3270263671875, 10.79345703125, 11.2598876953125, 11.726318359375, 12.1927490234375, 12.6591796875, 13.1256103515625, 13.592041015625, 14.0584716796875, 14.52490234375, 14.9913330078125, 15.457763671875, 15.9241943359375, 16.390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 1.0, 3.0, 18.0, 18.0, 19.0, 24.0, 52.0, 111.0, 169.0, 502.0, 1566.0, 10858.0, 612636.0, 411610.0, 8787.0, 1360.0, 433.0, 169.0, 94.0, 54.0, 31.0, 14.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8671875, -11.5843505859375, -11.301513671875, -11.0186767578125, -10.73583984375, -10.4530029296875, -10.170166015625, -9.8873291015625, -9.6044921875, -9.3216552734375, -9.038818359375, -8.7559814453125, -8.47314453125, -8.1903076171875, -7.907470703125, -7.6246337890625, -7.341796875, -7.0589599609375, -6.776123046875, -6.4932861328125, -6.21044921875, -5.9276123046875, -5.644775390625, -5.3619384765625, -5.0791015625, -4.7962646484375, -4.513427734375, -4.2305908203125, -3.94775390625, -3.6649169921875, -3.382080078125, -3.0992431640625, -2.81640625, -2.5335693359375, -2.250732421875, -1.9678955078125, -1.68505859375, -1.4022216796875, -1.119384765625, -0.8365478515625, -0.5537109375, -0.2708740234375, 0.011962890625, 0.2947998046875, 0.57763671875, 0.8604736328125, 1.143310546875, 1.4261474609375, 1.708984375, 1.9918212890625, 2.274658203125, 2.5574951171875, 2.84033203125, 3.1231689453125, 3.406005859375, 3.6888427734375, 3.9716796875, 4.2545166015625, 4.537353515625, 4.8201904296875, 5.10302734375, 5.3858642578125, 5.668701171875, 5.9515380859375, 6.234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 6.0, 6.0, 12.0, 5.0, 23.0, 22.0, 32.0, 29.0, 53.0, 70.0, 73.0, 111.0, 91.0, 79.0, 99.0, 71.0, 51.0, 35.0, 40.0, 26.0, 21.0, 15.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0007143020629882812, -0.0006958246231079102, -0.0006773471832275391, -0.000658869743347168, -0.0006403923034667969, -0.0006219148635864258, -0.0006034374237060547, -0.0005849599838256836, -0.0005664825439453125, -0.0005480051040649414, -0.0005295276641845703, -0.0005110502243041992, -0.0004925727844238281, -0.00047409534454345703, -0.00045561790466308594, -0.00043714046478271484, -0.00041866302490234375, -0.00040018558502197266, -0.00038170814514160156, -0.00036323070526123047, -0.0003447532653808594, -0.0003262758255004883, -0.0003077983856201172, -0.0002893209457397461, -0.000270843505859375, -0.0002523660659790039, -0.0002338886260986328, -0.00021541118621826172, -0.00019693374633789062, -0.00017845630645751953, -0.00015997886657714844, -0.00014150142669677734, -0.00012302398681640625, -0.00010454654693603516, -8.606910705566406e-05, -6.759166717529297e-05, -4.9114227294921875e-05, -3.063678741455078e-05, -1.2159347534179688e-05, 6.318092346191406e-06, 2.47955322265625e-05, 4.3272972106933594e-05, 6.175041198730469e-05, 8.022785186767578e-05, 9.870529174804688e-05, 0.00011718273162841797, 0.00013566017150878906, 0.00015413761138916016, 0.00017261505126953125, 0.00019109249114990234, 0.00020956993103027344, 0.00022804737091064453, 0.0002465248107910156, 0.0002650022506713867, 0.0002834796905517578, 0.0003019571304321289, 0.0003204345703125, 0.0003389120101928711, 0.0003573894500732422, 0.0003758668899536133, 0.0003943443298339844, 0.00041282176971435547, 0.00043129920959472656, 0.00044977664947509766, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 17.0, 23.0, 35.0, 52.0, 100.0, 191.0, 396.0, 1170.0, 4598.0, 41298.0, 805507.0, 181552.0, 10535.0, 1922.0, 576.0, 250.0, 119.0, 77.0, 41.0, 24.0, 19.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-8.65625, -8.44879150390625, -8.2413330078125, -8.03387451171875, -7.826416015625, -7.61895751953125, -7.4114990234375, -7.20404052734375, -6.99658203125, -6.78912353515625, -6.5816650390625, -6.37420654296875, -6.166748046875, -5.95928955078125, -5.7518310546875, -5.54437255859375, -5.3369140625, -5.12945556640625, -4.9219970703125, -4.71453857421875, -4.507080078125, -4.29962158203125, -4.0921630859375, -3.88470458984375, -3.67724609375, -3.46978759765625, -3.2623291015625, -3.05487060546875, -2.847412109375, -2.63995361328125, -2.4324951171875, -2.22503662109375, -2.017578125, -1.81011962890625, -1.6026611328125, -1.39520263671875, -1.187744140625, -0.98028564453125, -0.7728271484375, -0.56536865234375, -0.35791015625, -0.15045166015625, 0.0570068359375, 0.26446533203125, 0.471923828125, 0.67938232421875, 0.8868408203125, 1.09429931640625, 1.3017578125, 1.50921630859375, 1.7166748046875, 1.92413330078125, 2.131591796875, 2.33905029296875, 2.5465087890625, 2.75396728515625, 2.96142578125, 3.16888427734375, 3.3763427734375, 3.58380126953125, 3.791259765625, 3.99871826171875, 4.2061767578125, 4.41363525390625, 4.62109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 9.0, 11.0, 16.0, 27.0, 32.0, 53.0, 76.0, 101.0, 113.0, 137.0, 136.0, 99.0, 64.0, 39.0, 35.0, 20.0, 9.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -8.2083740234375, -8.018310546875, -7.8282470703125, -7.63818359375, -7.4481201171875, -7.258056640625, -7.0679931640625, -6.8779296875, -6.6878662109375, -6.497802734375, -6.3077392578125, -6.11767578125, -5.9276123046875, -5.737548828125, -5.5474853515625, -5.357421875, -5.1673583984375, -4.977294921875, -4.7872314453125, -4.59716796875, -4.4071044921875, -4.217041015625, -4.0269775390625, -3.8369140625, -3.6468505859375, -3.456787109375, -3.2667236328125, -3.07666015625, -2.8865966796875, -2.696533203125, -2.5064697265625, -2.31640625, -2.1263427734375, -1.936279296875, -1.7462158203125, -1.55615234375, -1.3660888671875, -1.176025390625, -0.9859619140625, -0.7958984375, -0.6058349609375, -0.415771484375, -0.2257080078125, -0.03564453125, 0.1544189453125, 0.344482421875, 0.5345458984375, 0.724609375, 0.9146728515625, 1.104736328125, 1.2947998046875, 1.48486328125, 1.6749267578125, 1.864990234375, 2.0550537109375, 2.2451171875, 2.4351806640625, 2.625244140625, 2.8153076171875, 3.00537109375, 3.1954345703125, 3.385498046875, 3.5755615234375, 3.765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 9.0, 20.0, 30.0, 109.0, 196.0, 258.0, 211.0, 103.0, 50.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-221.7382354736328, -217.44447326660156, -213.1507110595703, -208.85693359375, -204.56317138671875, -200.2694091796875, -195.97564697265625, -191.681884765625, -187.3881072998047, -183.09434509277344, -178.8005828857422, -174.50680541992188, -170.21304321289062, -165.91928100585938, -161.62551879882812, -157.33175659179688, -153.03799438476562, -148.74423217773438, -144.45046997070312, -140.1566925048828, -135.86293029785156, -131.5691680908203, -127.27540588378906, -122.98163604736328, -118.6878662109375, -114.39410400390625, -110.10033416748047, -105.80657196044922, -101.51280212402344, -97.21903991699219, -92.92527770996094, -88.63150787353516, -84.33773803710938, -80.04397583007812, -75.75020599365234, -71.4564437866211, -67.16267395019531, -62.86891174316406, -58.57514572143555, -54.28137969970703, -49.98761749267578, -45.693851470947266, -41.40008544921875, -37.1063232421875, -32.81255340576172, -28.518789291381836, -24.225025177001953, -19.931259155273438, -15.637493133544922, -11.343727111816406, -7.049962043762207, -2.756196975708008, 1.5375690460205078, 5.831335067749023, 10.125099182128906, 14.418865203857422, 18.712631225585938, 23.006397247314453, 27.30016326904297, 31.59392738342285, 35.8876953125, 40.18145751953125, 44.475223541259766, 48.76898956298828, 53.0627555847168]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 6.0, 7.0, 11.0, 15.0, 4.0, 16.0, 16.0, 19.0, 23.0, 28.0, 36.0, 41.0, 42.0, 43.0, 62.0, 72.0, 72.0, 51.0, 62.0, 47.0, 45.0, 56.0, 42.0, 40.0, 24.0, 22.0, 18.0, 13.0, 15.0, 13.0, 6.0, 13.0, 9.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-91.30396270751953, -89.07377624511719, -86.84359741210938, -84.61341094970703, -82.38323211669922, -80.15304565429688, -77.92286682128906, -75.69268035888672, -73.46249389648438, -71.23230743408203, -69.00212860107422, -66.77194213867188, -64.54176330566406, -62.31157684326172, -60.08139419555664, -57.85121154785156, -55.62103271484375, -53.39085006713867, -51.160667419433594, -48.930484771728516, -46.70030212402344, -44.470115661621094, -42.239933013916016, -40.00975036621094, -37.77956771850586, -35.54938507080078, -33.3192024230957, -31.089017868041992, -28.858835220336914, -26.628652572631836, -24.398468017578125, -22.168285369873047, -19.9381103515625, -17.707927703857422, -15.477744102478027, -13.247560501098633, -11.017377853393555, -8.787195205688477, -6.557011604309082, -4.3268280029296875, -2.0966453552246094, 0.13353776931762695, 2.3637208938598633, 4.5939040184021, 6.824087142944336, 9.054269790649414, 11.284453392028809, 13.514636993408203, 15.744819641113281, 17.97500228881836, 20.205184936523438, 22.43536949157715, 24.665552139282227, 26.895734786987305, 29.125919342041016, 31.356101989746094, 33.58628463745117, 35.81646728515625, 38.04664993286133, 40.276832580566406, 42.50701904296875, 44.73719787597656, 46.967384338378906, 49.197566986083984, 51.42774963378906]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 11.0, 9.0, 11.0, 9.0, 10.0, 20.0, 25.0, 33.0, 44.0, 65.0, 117.0, 182.0, 347.0, 666.0, 1638.0, 4433.0, 20373.0, 4026224.0, 124270.0, 10675.0, 2803.0, 1171.0, 523.0, 244.0, 145.0, 93.0, 50.0, 29.0, 21.0, 16.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1640625, -14.7630615234375, -14.362060546875, -13.9610595703125, -13.56005859375, -13.1590576171875, -12.758056640625, -12.3570556640625, -11.9560546875, -11.5550537109375, -11.154052734375, -10.7530517578125, -10.35205078125, -9.9510498046875, -9.550048828125, -9.1490478515625, -8.748046875, -8.3470458984375, -7.946044921875, -7.5450439453125, -7.14404296875, -6.7430419921875, -6.342041015625, -5.9410400390625, -5.5400390625, -5.1390380859375, -4.738037109375, -4.3370361328125, -3.93603515625, -3.5350341796875, -3.134033203125, -2.7330322265625, -2.33203125, -1.9310302734375, -1.530029296875, -1.1290283203125, -0.72802734375, -0.3270263671875, 0.073974609375, 0.4749755859375, 0.8759765625, 1.2769775390625, 1.677978515625, 2.0789794921875, 2.47998046875, 2.8809814453125, 3.281982421875, 3.6829833984375, 4.083984375, 4.4849853515625, 4.885986328125, 5.2869873046875, 5.68798828125, 6.0889892578125, 6.489990234375, 6.8909912109375, 7.2919921875, 7.6929931640625, 8.093994140625, 8.4949951171875, 8.89599609375, 9.2969970703125, 9.697998046875, 10.0989990234375, 10.5]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 6.0, 6.0, 10.0, 12.0, 18.0, 14.0, 34.0, 49.0, 69.0, 96.0, 91.0, 118.0, 115.0, 83.0, 80.0, 54.0, 40.0, 33.0, 23.0, 20.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.53717041015625, -6.3673095703125, -6.19744873046875, -6.027587890625, -5.85772705078125, -5.6878662109375, -5.51800537109375, -5.34814453125, -5.17828369140625, -5.0084228515625, -4.83856201171875, -4.668701171875, -4.49884033203125, -4.3289794921875, -4.15911865234375, -3.9892578125, -3.81939697265625, -3.6495361328125, -3.47967529296875, -3.309814453125, -3.13995361328125, -2.9700927734375, -2.80023193359375, -2.63037109375, -2.46051025390625, -2.2906494140625, -2.12078857421875, -1.950927734375, -1.78106689453125, -1.6112060546875, -1.44134521484375, -1.271484375, -1.10162353515625, -0.9317626953125, -0.76190185546875, -0.592041015625, -0.42218017578125, -0.2523193359375, -0.08245849609375, 0.08740234375, 0.25726318359375, 0.4271240234375, 0.59698486328125, 0.766845703125, 0.93670654296875, 1.1065673828125, 1.27642822265625, 1.4462890625, 1.61614990234375, 1.7860107421875, 1.95587158203125, 2.125732421875, 2.29559326171875, 2.4654541015625, 2.63531494140625, 2.80517578125, 2.97503662109375, 3.1448974609375, 3.31475830078125, 3.484619140625, 3.65447998046875, 3.8243408203125, 3.99420166015625, 4.1640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 29.0, 37.0, 37.0, 69.0, 111.0, 170.0, 290.0, 448.0, 741.0, 1500.0, 3509.0, 11471.0, 97178.0, 4025778.0, 39849.0, 7533.0, 2635.0, 1222.0, 613.0, 387.0, 241.0, 143.0, 93.0, 56.0, 38.0, 22.0, 13.0, 13.0, 10.0, 8.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4765625, -14.0289306640625, -13.581298828125, -13.1336669921875, -12.68603515625, -12.2384033203125, -11.790771484375, -11.3431396484375, -10.8955078125, -10.4478759765625, -10.000244140625, -9.5526123046875, -9.10498046875, -8.6573486328125, -8.209716796875, -7.7620849609375, -7.314453125, -6.8668212890625, -6.419189453125, -5.9715576171875, -5.52392578125, -5.0762939453125, -4.628662109375, -4.1810302734375, -3.7333984375, -3.2857666015625, -2.838134765625, -2.3905029296875, -1.94287109375, -1.4952392578125, -1.047607421875, -0.5999755859375, -0.15234375, 0.2952880859375, 0.742919921875, 1.1905517578125, 1.63818359375, 2.0858154296875, 2.533447265625, 2.9810791015625, 3.4287109375, 3.8763427734375, 4.323974609375, 4.7716064453125, 5.21923828125, 5.6668701171875, 6.114501953125, 6.5621337890625, 7.009765625, 7.4573974609375, 7.905029296875, 8.3526611328125, 8.80029296875, 9.2479248046875, 9.695556640625, 10.1431884765625, 10.5908203125, 11.0384521484375, 11.486083984375, 11.9337158203125, 12.38134765625, 12.8289794921875, 13.276611328125, 13.7242431640625, 14.171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 15.0, 25.0, 66.0, 182.0, 3385.0, 224.0, 71.0, 33.0, 19.0, 14.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.8543701171875, -5.642333984375, -5.4302978515625, -5.21826171875, -5.0062255859375, -4.794189453125, -4.5821533203125, -4.3701171875, -4.1580810546875, -3.946044921875, -3.7340087890625, -3.52197265625, -3.3099365234375, -3.097900390625, -2.8858642578125, -2.673828125, -2.4617919921875, -2.249755859375, -2.0377197265625, -1.82568359375, -1.6136474609375, -1.401611328125, -1.1895751953125, -0.9775390625, -0.7655029296875, -0.553466796875, -0.3414306640625, -0.12939453125, 0.0826416015625, 0.294677734375, 0.5067138671875, 0.71875, 0.9307861328125, 1.142822265625, 1.3548583984375, 1.56689453125, 1.7789306640625, 1.990966796875, 2.2030029296875, 2.4150390625, 2.6270751953125, 2.839111328125, 3.0511474609375, 3.26318359375, 3.4752197265625, 3.687255859375, 3.8992919921875, 4.111328125, 4.3233642578125, 4.535400390625, 4.7474365234375, 4.95947265625, 5.1715087890625, 5.383544921875, 5.5955810546875, 5.8076171875, 6.0196533203125, 6.231689453125, 6.4437255859375, 6.65576171875, 6.8677978515625, 7.079833984375, 7.2918701171875, 7.50390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 3.0, 2.0, 7.0, 10.0, 9.0, 10.0, 14.0, 28.0, 26.0, 48.0, 91.0, 83.0, 125.0, 143.0, 133.0, 90.0, 57.0, 54.0, 21.0, 17.0, 12.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.181058883666992, -24.566375732421875, -23.95169448852539, -23.337011337280273, -22.72233009338379, -22.107646942138672, -21.492965698242188, -20.87828254699707, -20.263599395751953, -19.648916244506836, -19.03423500061035, -18.419551849365234, -17.80487060546875, -17.190187454223633, -16.575504302978516, -15.960823059082031, -15.34614086151123, -14.73145866394043, -14.116776466369629, -13.502094268798828, -12.887411117553711, -12.27272891998291, -11.65804672241211, -11.043363571166992, -10.428682327270508, -9.814000129699707, -9.199317932128906, -8.584634780883789, -7.969952583312988, -7.3552703857421875, -6.740588188171387, -6.125905513763428, -5.511222839355469, -4.896540641784668, -4.281857967376709, -3.667175769805908, -3.0524933338165283, -2.4378108978271484, -1.8231287002563477, -1.2084460258483887, -0.5937638282775879, 0.020918548107147217, 0.6356009244918823, 1.2502832412719727, 1.8649656772613525, 2.4796481132507324, 3.094330310821533, 3.709012985229492, 4.323695182800293, 4.938377380371094, 5.553060054779053, 6.1677422523498535, 6.7824249267578125, 7.397107124328613, 8.011789321899414, 8.626472473144531, 9.241153717041016, 9.855835914611816, 10.470518112182617, 11.085201263427734, 11.699883460998535, 12.314565658569336, 12.929247856140137, 13.543930053710938, 14.158613204956055]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 6.0, 9.0, 12.0, 24.0, 23.0, 27.0, 26.0, 26.0, 30.0, 33.0, 32.0, 44.0, 43.0, 45.0, 36.0, 54.0, 36.0, 51.0, 48.0, 45.0, 48.0, 34.0, 36.0, 29.0, 34.0, 28.0, 25.0, 14.0, 14.0, 9.0, 13.0, 5.0, 12.0, 12.0, 5.0, 8.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.813680648803711, -11.383864402770996, -10.954048156738281, -10.524232864379883, -10.094416618347168, -9.664600372314453, -9.234784126281738, -8.804967880249023, -8.375152587890625, -7.94533634185791, -7.5155205726623535, -7.085704326629639, -6.655888557434082, -6.226072311401367, -5.796256065368652, -5.366440296173096, -4.936624050140381, -4.506807804107666, -4.076992034912109, -3.6471757888793945, -3.217360019683838, -2.787543773651123, -2.3577277660369873, -1.9279117584228516, -1.4980957508087158, -1.06827974319458, -0.6384636759757996, -0.20864760875701904, 0.2211683988571167, 0.650984525680542, 1.0808005332946777, 1.5106165409088135, 1.9404325485229492, 2.370248556137085, 2.8000645637512207, 3.2298808097839355, 3.659696578979492, 4.089512825012207, 4.519329071044922, 4.9491448402404785, 5.378960609436035, 5.80877685546875, 6.238592624664307, 6.6684088706970215, 7.098224639892578, 7.528040885925293, 7.957857131958008, 8.387672424316406, 8.817489624023438, 9.247305870056152, 9.677122116088867, 10.106937408447266, 10.53675365447998, 10.966569900512695, 11.39638614654541, 11.826202392578125, 12.256017684936523, 12.685833930969238, 13.115650177001953, 13.545465469360352, 13.975281715393066, 14.405097961425781, 14.834914207458496, 15.264730453491211, 15.69454574584961]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 15.0, 35.0, 60.0, 126.0, 280.0, 795.0, 2357.0, 10621.0, 85296.0, 697423.0, 224015.0, 21455.0, 4162.0, 1144.0, 424.0, 167.0, 68.0, 39.0, 22.0, 18.0, 5.0, 6.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.4920654296875, -9.054443359375, -8.6168212890625, -8.17919921875, -7.7415771484375, -7.303955078125, -6.8663330078125, -6.4287109375, -5.9910888671875, -5.553466796875, -5.1158447265625, -4.67822265625, -4.2406005859375, -3.802978515625, -3.3653564453125, -2.927734375, -2.4901123046875, -2.052490234375, -1.6148681640625, -1.17724609375, -0.7396240234375, -0.302001953125, 0.1356201171875, 0.5732421875, 1.0108642578125, 1.448486328125, 1.8861083984375, 2.32373046875, 2.7613525390625, 3.198974609375, 3.6365966796875, 4.07421875, 4.5118408203125, 4.949462890625, 5.3870849609375, 5.82470703125, 6.2623291015625, 6.699951171875, 7.1375732421875, 7.5751953125, 8.0128173828125, 8.450439453125, 8.8880615234375, 9.32568359375, 9.7633056640625, 10.200927734375, 10.6385498046875, 11.076171875, 11.5137939453125, 11.951416015625, 12.3890380859375, 12.82666015625, 13.2642822265625, 13.701904296875, 14.1395263671875, 14.5771484375, 15.0147705078125, 15.452392578125, 15.8900146484375, 16.32763671875, 16.7652587890625, 17.202880859375, 17.6405029296875, 18.078125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 10.0, 17.0, 25.0, 25.0, 30.0, 41.0, 33.0, 56.0, 55.0, 65.0, 68.0, 75.0, 71.0, 64.0, 61.0, 56.0, 41.0, 43.0, 32.0, 21.0, 18.0, 15.0, 12.0, 5.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.59765625, -4.47406005859375, -4.3504638671875, -4.22686767578125, -4.103271484375, -3.97967529296875, -3.8560791015625, -3.73248291015625, -3.60888671875, -3.48529052734375, -3.3616943359375, -3.23809814453125, -3.114501953125, -2.99090576171875, -2.8673095703125, -2.74371337890625, -2.6201171875, -2.49652099609375, -2.3729248046875, -2.24932861328125, -2.125732421875, -2.00213623046875, -1.8785400390625, -1.75494384765625, -1.63134765625, -1.50775146484375, -1.3841552734375, -1.26055908203125, -1.136962890625, -1.01336669921875, -0.8897705078125, -0.76617431640625, -0.642578125, -0.51898193359375, -0.3953857421875, -0.27178955078125, -0.148193359375, -0.02459716796875, 0.0989990234375, 0.22259521484375, 0.34619140625, 0.46978759765625, 0.5933837890625, 0.71697998046875, 0.840576171875, 0.96417236328125, 1.0877685546875, 1.21136474609375, 1.3349609375, 1.45855712890625, 1.5821533203125, 1.70574951171875, 1.829345703125, 1.95294189453125, 2.0765380859375, 2.20013427734375, 2.32373046875, 2.44732666015625, 2.5709228515625, 2.69451904296875, 2.818115234375, 2.94171142578125, 3.0653076171875, 3.18890380859375, 3.3125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 4.0, 13.0, 13.0, 21.0, 43.0, 46.0, 63.0, 129.0, 249.0, 510.0, 1196.0, 3268.0, 12793.0, 94489.0, 725717.0, 182705.0, 19970.0, 4441.0, 1548.0, 595.0, 312.0, 139.0, 83.0, 56.0, 43.0, 31.0, 10.0, 18.0, 9.0, 8.0, 5.0, 5.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.7109375, -13.30322265625, -12.8955078125, -12.48779296875, -12.080078125, -11.67236328125, -11.2646484375, -10.85693359375, -10.44921875, -10.04150390625, -9.6337890625, -9.22607421875, -8.818359375, -8.41064453125, -8.0029296875, -7.59521484375, -7.1875, -6.77978515625, -6.3720703125, -5.96435546875, -5.556640625, -5.14892578125, -4.7412109375, -4.33349609375, -3.92578125, -3.51806640625, -3.1103515625, -2.70263671875, -2.294921875, -1.88720703125, -1.4794921875, -1.07177734375, -0.6640625, -0.25634765625, 0.1513671875, 0.55908203125, 0.966796875, 1.37451171875, 1.7822265625, 2.18994140625, 2.59765625, 3.00537109375, 3.4130859375, 3.82080078125, 4.228515625, 4.63623046875, 5.0439453125, 5.45166015625, 5.859375, 6.26708984375, 6.6748046875, 7.08251953125, 7.490234375, 7.89794921875, 8.3056640625, 8.71337890625, 9.12109375, 9.52880859375, 9.9365234375, 10.34423828125, 10.751953125, 11.15966796875, 11.5673828125, 11.97509765625, 12.3828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 9.0, 15.0, 8.0, 11.0, 13.0, 17.0, 23.0, 31.0, 22.0, 31.0, 40.0, 53.0, 35.0, 38.0, 49.0, 63.0, 54.0, 51.0, 58.0, 40.0, 37.0, 35.0, 46.0, 39.0, 31.0, 26.0, 21.0, 17.0, 17.0, 11.0, 8.0, 14.0, 9.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-16.15625, -15.7005615234375, -15.244873046875, -14.7891845703125, -14.33349609375, -13.8778076171875, -13.422119140625, -12.9664306640625, -12.5107421875, -12.0550537109375, -11.599365234375, -11.1436767578125, -10.68798828125, -10.2322998046875, -9.776611328125, -9.3209228515625, -8.865234375, -8.4095458984375, -7.953857421875, -7.4981689453125, -7.04248046875, -6.5867919921875, -6.131103515625, -5.6754150390625, -5.2197265625, -4.7640380859375, -4.308349609375, -3.8526611328125, -3.39697265625, -2.9412841796875, -2.485595703125, -2.0299072265625, -1.57421875, -1.1185302734375, -0.662841796875, -0.2071533203125, 0.24853515625, 0.7042236328125, 1.159912109375, 1.6156005859375, 2.0712890625, 2.5269775390625, 2.982666015625, 3.4383544921875, 3.89404296875, 4.3497314453125, 4.805419921875, 5.2611083984375, 5.716796875, 6.1724853515625, 6.628173828125, 7.0838623046875, 7.53955078125, 7.9952392578125, 8.450927734375, 8.9066162109375, 9.3623046875, 9.8179931640625, 10.273681640625, 10.7293701171875, 11.18505859375, 11.6407470703125, 12.096435546875, 12.5521240234375, 13.0078125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 6.0, 1.0, 8.0, 12.0, 18.0, 31.0, 32.0, 58.0, 76.0, 150.0, 274.0, 558.0, 1529.0, 6622.0, 90667.0, 884506.0, 56434.0, 5099.0, 1308.0, 524.0, 257.0, 134.0, 79.0, 58.0, 38.0, 18.0, 16.0, 9.0, 11.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15234375, -5.95660400390625, -5.7608642578125, -5.56512451171875, -5.369384765625, -5.17364501953125, -4.9779052734375, -4.78216552734375, -4.58642578125, -4.39068603515625, -4.1949462890625, -3.99920654296875, -3.803466796875, -3.60772705078125, -3.4119873046875, -3.21624755859375, -3.0205078125, -2.82476806640625, -2.6290283203125, -2.43328857421875, -2.237548828125, -2.04180908203125, -1.8460693359375, -1.65032958984375, -1.45458984375, -1.25885009765625, -1.0631103515625, -0.86737060546875, -0.671630859375, -0.47589111328125, -0.2801513671875, -0.08441162109375, 0.111328125, 0.30706787109375, 0.5028076171875, 0.69854736328125, 0.894287109375, 1.09002685546875, 1.2857666015625, 1.48150634765625, 1.67724609375, 1.87298583984375, 2.0687255859375, 2.26446533203125, 2.460205078125, 2.65594482421875, 2.8516845703125, 3.04742431640625, 3.2431640625, 3.43890380859375, 3.6346435546875, 3.83038330078125, 4.026123046875, 4.22186279296875, 4.4176025390625, 4.61334228515625, 4.80908203125, 5.00482177734375, 5.2005615234375, 5.39630126953125, 5.592041015625, 5.78778076171875, 5.9835205078125, 6.17926025390625, 6.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 12.0, 44.0, 58.0, 135.0, 188.0, 246.0, 138.0, 84.0, 40.0, 15.0, 14.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00211334228515625, -0.002069428563117981, -0.002025514841079712, -0.001981601119041443, -0.0019376873970031738, -0.0018937736749649048, -0.0018498599529266357, -0.0018059462308883667, -0.0017620325088500977, -0.0017181187868118286, -0.0016742050647735596, -0.0016302913427352905, -0.0015863776206970215, -0.0015424638986587524, -0.0014985501766204834, -0.0014546364545822144, -0.0014107227325439453, -0.0013668090105056763, -0.0013228952884674072, -0.0012789815664291382, -0.0012350678443908691, -0.0011911541223526, -0.001147240400314331, -0.001103326678276062, -0.001059412956237793, -0.001015499234199524, -0.0009715855121612549, -0.0009276717901229858, -0.0008837580680847168, -0.0008398443460464478, -0.0007959306240081787, -0.0007520169019699097, -0.0007081031799316406, -0.0006641894578933716, -0.0006202757358551025, -0.0005763620138168335, -0.0005324482917785645, -0.0004885345697402954, -0.00044462084770202637, -0.0004007071256637573, -0.0003567934036254883, -0.00031287968158721924, -0.0002689659595489502, -0.00022505223751068115, -0.0001811385154724121, -0.00013722479343414307, -9.331107139587402e-05, -4.939734935760498e-05, -5.4836273193359375e-06, 3.8430094718933105e-05, 8.234381675720215e-05, 0.0001262575387954712, 0.00017017126083374023, 0.00021408498287200928, 0.0002579987049102783, 0.00030191242694854736, 0.0003458261489868164, 0.00038973987102508545, 0.0004336535930633545, 0.00047756731510162354, 0.0005214810371398926, 0.0005653947591781616, 0.0006093084812164307, 0.0006532222032546997, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 6.0, 11.0, 18.0, 26.0, 48.0, 95.0, 138.0, 269.0, 598.0, 1578.0, 6099.0, 56740.0, 853405.0, 117199.0, 8854.0, 1997.0, 724.0, 330.0, 167.0, 94.0, 49.0, 30.0, 22.0, 17.0, 12.0, 7.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0859375, -5.91009521484375, -5.7342529296875, -5.55841064453125, -5.382568359375, -5.20672607421875, -5.0308837890625, -4.85504150390625, -4.67919921875, -4.50335693359375, -4.3275146484375, -4.15167236328125, -3.975830078125, -3.79998779296875, -3.6241455078125, -3.44830322265625, -3.2724609375, -3.09661865234375, -2.9207763671875, -2.74493408203125, -2.569091796875, -2.39324951171875, -2.2174072265625, -2.04156494140625, -1.86572265625, -1.68988037109375, -1.5140380859375, -1.33819580078125, -1.162353515625, -0.98651123046875, -0.8106689453125, -0.63482666015625, -0.458984375, -0.28314208984375, -0.1072998046875, 0.06854248046875, 0.244384765625, 0.42022705078125, 0.5960693359375, 0.77191162109375, 0.94775390625, 1.12359619140625, 1.2994384765625, 1.47528076171875, 1.651123046875, 1.82696533203125, 2.0028076171875, 2.17864990234375, 2.3544921875, 2.53033447265625, 2.7061767578125, 2.88201904296875, 3.057861328125, 3.23370361328125, 3.4095458984375, 3.58538818359375, 3.76123046875, 3.93707275390625, 4.1129150390625, 4.28875732421875, 4.464599609375, 4.64044189453125, 4.8162841796875, 4.99212646484375, 5.16796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 7.0, 11.0, 12.0, 8.0, 23.0, 35.0, 43.0, 77.0, 71.0, 111.0, 107.0, 118.0, 103.0, 79.0, 60.0, 32.0, 30.0, 30.0, 13.0, 10.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.70703125, -4.56365966796875, -4.4202880859375, -4.27691650390625, -4.133544921875, -3.99017333984375, -3.8468017578125, -3.70343017578125, -3.56005859375, -3.41668701171875, -3.2733154296875, -3.12994384765625, -2.986572265625, -2.84320068359375, -2.6998291015625, -2.55645751953125, -2.4130859375, -2.26971435546875, -2.1263427734375, -1.98297119140625, -1.839599609375, -1.69622802734375, -1.5528564453125, -1.40948486328125, -1.26611328125, -1.12274169921875, -0.9793701171875, -0.83599853515625, -0.692626953125, -0.54925537109375, -0.4058837890625, -0.26251220703125, -0.119140625, 0.02423095703125, 0.1676025390625, 0.31097412109375, 0.454345703125, 0.59771728515625, 0.7410888671875, 0.88446044921875, 1.02783203125, 1.17120361328125, 1.3145751953125, 1.45794677734375, 1.601318359375, 1.74468994140625, 1.8880615234375, 2.03143310546875, 2.1748046875, 2.31817626953125, 2.4615478515625, 2.60491943359375, 2.748291015625, 2.89166259765625, 3.0350341796875, 3.17840576171875, 3.32177734375, 3.46514892578125, 3.6085205078125, 3.75189208984375, 3.895263671875, 4.03863525390625, 4.1820068359375, 4.32537841796875, 4.46875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 15.0, 46.0, 87.0, 173.0, 270.0, 206.0, 112.0, 52.0, 26.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-178.2339324951172, -174.05209350585938, -169.8702392578125, -165.6884002685547, -161.50656127929688, -157.32470703125, -153.1428680419922, -148.9610137939453, -144.7791748046875, -140.5973358154297, -136.4154815673828, -132.233642578125, -128.05178833007812, -123.86994934082031, -119.6881103515625, -115.50626373291016, -111.32441711425781, -107.14257049560547, -102.96072387695312, -98.77888488769531, -94.59703826904297, -90.41519165039062, -86.23335266113281, -82.05150604248047, -77.86965942382812, -73.68781280517578, -69.50596618652344, -65.32412719726562, -61.14228057861328, -56.96043395996094, -52.77859115600586, -48.59674835205078, -44.4149169921875, -40.233070373535156, -36.05122756958008, -31.869382858276367, -27.687538146972656, -23.505693435668945, -19.323848724365234, -15.142004013061523, -10.960159301757812, -6.778314590454102, -2.5964698791503906, 1.5853748321533203, 5.767219543457031, 9.949064254760742, 14.130908966064453, 18.312753677368164, 22.494598388671875, 26.676443099975586, 30.858287811279297, 35.040130615234375, 39.22197723388672, 43.40382385253906, 47.58566665649414, 51.76750946044922, 55.94935607910156, 60.131202697753906, 64.31304931640625, 68.49488830566406, 72.6767349243164, 76.85858154296875, 81.04042053222656, 85.2222671508789, 89.40411376953125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 14.0, 9.0, 10.0, 18.0, 17.0, 21.0, 28.0, 24.0, 38.0, 36.0, 47.0, 44.0, 37.0, 48.0, 57.0, 48.0, 69.0, 58.0, 37.0, 54.0, 50.0, 38.0, 31.0, 29.0, 29.0, 17.0, 16.0, 17.0, 14.0, 9.0, 7.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.782127380371094, -48.71908950805664, -46.65605163574219, -44.593013763427734, -42.52997589111328, -40.46693801879883, -38.403900146484375, -36.34086227416992, -34.27782440185547, -32.214786529541016, -30.151748657226562, -28.08871078491211, -26.025672912597656, -23.962635040283203, -21.89959716796875, -19.836559295654297, -17.773521423339844, -15.71048355102539, -13.647445678710938, -11.584407806396484, -9.521369934082031, -7.458332061767578, -5.395294189453125, -3.332256317138672, -1.2692184448242188, 0.7938194274902344, 2.8568572998046875, 4.919895172119141, 6.982933044433594, 9.045970916748047, 11.1090087890625, 13.172046661376953, 15.235076904296875, 17.298114776611328, 19.36115264892578, 21.424190521240234, 23.487228393554688, 25.55026626586914, 27.613304138183594, 29.676342010498047, 31.7393798828125, 33.80241775512695, 35.865455627441406, 37.92849349975586, 39.99153137207031, 42.054569244384766, 44.11760711669922, 46.18064498901367, 48.243682861328125, 50.30672073364258, 52.36975860595703, 54.432796478271484, 56.49583435058594, 58.55887222290039, 60.621910095214844, 62.6849479675293, 64.74798583984375, 66.81101989746094, 68.87406158447266, 70.93710327148438, 73.00013732910156, 75.06317138671875, 77.12621307373047, 79.18925476074219, 81.25228881835938]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 12.0, 16.0, 22.0, 32.0, 67.0, 86.0, 195.0, 487.0, 1349.0, 4831.0, 28553.0, 1505011.0, 2610299.0, 35585.0, 5659.0, 1342.0, 415.0, 182.0, 56.0, 32.0, 14.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.53778076171875, -15.1849365234375, -14.83209228515625, -14.479248046875, -14.12640380859375, -13.7735595703125, -13.42071533203125, -13.06787109375, -12.71502685546875, -12.3621826171875, -12.00933837890625, -11.656494140625, -11.30364990234375, -10.9508056640625, -10.59796142578125, -10.2451171875, -9.89227294921875, -9.5394287109375, -9.18658447265625, -8.833740234375, -8.48089599609375, -8.1280517578125, -7.77520751953125, -7.42236328125, -7.06951904296875, -6.7166748046875, -6.36383056640625, -6.010986328125, -5.65814208984375, -5.3052978515625, -4.95245361328125, -4.599609375, -4.24676513671875, -3.8939208984375, -3.54107666015625, -3.188232421875, -2.83538818359375, -2.4825439453125, -2.12969970703125, -1.77685546875, -1.42401123046875, -1.0711669921875, -0.71832275390625, -0.365478515625, -0.01263427734375, 0.3402099609375, 0.69305419921875, 1.0458984375, 1.39874267578125, 1.7515869140625, 2.10443115234375, 2.457275390625, 2.81011962890625, 3.1629638671875, 3.51580810546875, 3.86865234375, 4.22149658203125, 4.5743408203125, 4.92718505859375, 5.280029296875, 5.63287353515625, 5.9857177734375, 6.33856201171875, 6.69140625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 9.0, 19.0, 19.0, 21.0, 41.0, 61.0, 72.0, 77.0, 90.0, 93.0, 94.0, 93.0, 88.0, 53.0, 60.0, 37.0, 30.0, 18.0, 8.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.453125, -7.2972412109375, -7.141357421875, -6.9854736328125, -6.82958984375, -6.6737060546875, -6.517822265625, -6.3619384765625, -6.2060546875, -6.0501708984375, -5.894287109375, -5.7384033203125, -5.58251953125, -5.4266357421875, -5.270751953125, -5.1148681640625, -4.958984375, -4.8031005859375, -4.647216796875, -4.4913330078125, -4.33544921875, -4.1795654296875, -4.023681640625, -3.8677978515625, -3.7119140625, -3.5560302734375, -3.400146484375, -3.2442626953125, -3.08837890625, -2.9324951171875, -2.776611328125, -2.6207275390625, -2.46484375, -2.3089599609375, -2.153076171875, -1.9971923828125, -1.84130859375, -1.6854248046875, -1.529541015625, -1.3736572265625, -1.2177734375, -1.0618896484375, -0.906005859375, -0.7501220703125, -0.59423828125, -0.4383544921875, -0.282470703125, -0.1265869140625, 0.029296875, 0.1851806640625, 0.341064453125, 0.4969482421875, 0.65283203125, 0.8087158203125, 0.964599609375, 1.1204833984375, 1.2763671875, 1.4322509765625, 1.588134765625, 1.7440185546875, 1.89990234375, 2.0557861328125, 2.211669921875, 2.3675537109375, 2.5234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 19.0, 33.0, 36.0, 108.0, 192.0, 477.0, 1475.0, 4973.0, 23655.0, 279534.0, 3764339.0, 101253.0, 13559.0, 3043.0, 903.0, 313.0, 155.0, 86.0, 42.0, 26.0, 9.0, 9.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.1953125, -12.8321533203125, -12.468994140625, -12.1058349609375, -11.74267578125, -11.3795166015625, -11.016357421875, -10.6531982421875, -10.2900390625, -9.9268798828125, -9.563720703125, -9.2005615234375, -8.83740234375, -8.4742431640625, -8.111083984375, -7.7479248046875, -7.384765625, -7.0216064453125, -6.658447265625, -6.2952880859375, -5.93212890625, -5.5689697265625, -5.205810546875, -4.8426513671875, -4.4794921875, -4.1163330078125, -3.753173828125, -3.3900146484375, -3.02685546875, -2.6636962890625, -2.300537109375, -1.9373779296875, -1.57421875, -1.2110595703125, -0.847900390625, -0.4847412109375, -0.12158203125, 0.2415771484375, 0.604736328125, 0.9678955078125, 1.3310546875, 1.6942138671875, 2.057373046875, 2.4205322265625, 2.78369140625, 3.1468505859375, 3.510009765625, 3.8731689453125, 4.236328125, 4.5994873046875, 4.962646484375, 5.3258056640625, 5.68896484375, 6.0521240234375, 6.415283203125, 6.7784423828125, 7.1416015625, 7.5047607421875, 7.867919921875, 8.2310791015625, 8.59423828125, 8.9573974609375, 9.320556640625, 9.6837158203125, 10.046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 8.0, 2.0, 10.0, 9.0, 13.0, 14.0, 24.0, 37.0, 42.0, 67.0, 111.0, 171.0, 350.0, 844.0, 1146.0, 521.0, 259.0, 135.0, 79.0, 44.0, 45.0, 35.0, 18.0, 20.0, 12.0, 15.0, 10.0, 4.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.5546875, -7.30517578125, -7.0556640625, -6.80615234375, -6.556640625, -6.30712890625, -6.0576171875, -5.80810546875, -5.55859375, -5.30908203125, -5.0595703125, -4.81005859375, -4.560546875, -4.31103515625, -4.0615234375, -3.81201171875, -3.5625, -3.31298828125, -3.0634765625, -2.81396484375, -2.564453125, -2.31494140625, -2.0654296875, -1.81591796875, -1.56640625, -1.31689453125, -1.0673828125, -0.81787109375, -0.568359375, -0.31884765625, -0.0693359375, 0.18017578125, 0.4296875, 0.67919921875, 0.9287109375, 1.17822265625, 1.427734375, 1.67724609375, 1.9267578125, 2.17626953125, 2.42578125, 2.67529296875, 2.9248046875, 3.17431640625, 3.423828125, 3.67333984375, 3.9228515625, 4.17236328125, 4.421875, 4.67138671875, 4.9208984375, 5.17041015625, 5.419921875, 5.66943359375, 5.9189453125, 6.16845703125, 6.41796875, 6.66748046875, 6.9169921875, 7.16650390625, 7.416015625, 7.66552734375, 7.9150390625, 8.16455078125, 8.4140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 17.0, 10.0, 27.0, 62.0, 148.0, 213.0, 211.0, 165.0, 64.0, 32.0, 26.0, 7.0, 4.0, 2.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.34654235839844, -73.52115631103516, -70.69577026367188, -67.87037658691406, -65.04499053955078, -62.2196044921875, -59.39421844482422, -56.56883239746094, -53.74344253540039, -50.91805648803711, -48.09266662597656, -45.26728057861328, -42.44189453125, -39.61650466918945, -36.79111862182617, -33.965728759765625, -31.140342712402344, -28.31495475769043, -25.489566802978516, -22.664180755615234, -19.83879280090332, -17.013404846191406, -14.188018798828125, -11.362630844116211, -8.537242889404297, -5.711855411529541, -2.886467933654785, -0.0610809326171875, 2.7643070220947266, 5.589694976806641, 8.415081024169922, 11.240468978881836, 14.065864562988281, 16.891252517700195, 19.71664047241211, 22.54202651977539, 25.367414474487305, 28.19280242919922, 31.0181884765625, 33.84357452392578, 36.66896438598633, 39.49435043334961, 42.319740295410156, 45.14512634277344, 47.97051239013672, 50.795902252197266, 53.62128829956055, 56.446678161621094, 59.272064208984375, 62.097450256347656, 64.92283630371094, 67.74822998046875, 70.57361602783203, 73.39900207519531, 76.2243881225586, 79.04977416992188, 81.87516784667969, 84.70055389404297, 87.52593994140625, 90.35133361816406, 93.17671966552734, 96.00210571289062, 98.8274917602539, 101.65287780761719, 104.47826385498047]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 8.0, 6.0, 13.0, 18.0, 12.0, 13.0, 16.0, 16.0, 24.0, 31.0, 30.0, 44.0, 37.0, 46.0, 46.0, 50.0, 44.0, 54.0, 49.0, 39.0, 36.0, 48.0, 32.0, 41.0, 38.0, 33.0, 26.0, 23.0, 27.0, 18.0, 22.0, 9.0, 10.0, 6.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.3267936706543, -31.235261917114258, -30.14373016357422, -29.052196502685547, -27.960664749145508, -26.86913299560547, -25.777599334716797, -24.686067581176758, -23.59453582763672, -22.50300407409668, -21.41147232055664, -20.31993865966797, -19.22840690612793, -18.13687515258789, -17.04534149169922, -15.95380973815918, -14.86227798461914, -13.770746231079102, -12.679213523864746, -11.58768081665039, -10.496149063110352, -9.404617309570312, -8.313084602355957, -7.22155237197876, -6.1300201416015625, -5.038487911224365, -3.946955680847168, -2.8554234504699707, -1.7638912200927734, -0.6723589897155762, 0.4191732406616211, 1.5107054710388184, 2.6022377014160156, 3.693769931793213, 4.78530216217041, 5.876834392547607, 6.968366622924805, 8.059898376464844, 9.1514310836792, 10.242963790893555, 11.334495544433594, 12.426027297973633, 13.517560005187988, 14.609092712402344, 15.700624465942383, 16.792156219482422, 17.883689880371094, 18.975221633911133, 20.066753387451172, 21.15828514099121, 22.24981689453125, 23.341350555419922, 24.43288230895996, 25.5244140625, 26.615947723388672, 27.70747947692871, 28.79901123046875, 29.89054298400879, 30.982074737548828, 32.0736083984375, 33.165138244628906, 34.25667190551758, 35.34820556640625, 36.439735412597656, 37.53126907348633]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 8.0, 18.0, 24.0, 33.0, 34.0, 47.0, 110.0, 179.0, 287.0, 457.0, 837.0, 1569.0, 2975.0, 5919.0, 12229.0, 28188.0, 69237.0, 173111.0, 350700.0, 237048.0, 94605.0, 38703.0, 16588.0, 7503.0, 3719.0, 1967.0, 1004.0, 586.0, 318.0, 190.0, 133.0, 73.0, 42.0, 31.0, 29.0, 14.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.88671875, -4.74578857421875, -4.6048583984375, -4.46392822265625, -4.322998046875, -4.18206787109375, -4.0411376953125, -3.90020751953125, -3.75927734375, -3.61834716796875, -3.4774169921875, -3.33648681640625, -3.195556640625, -3.05462646484375, -2.9136962890625, -2.77276611328125, -2.6318359375, -2.49090576171875, -2.3499755859375, -2.20904541015625, -2.068115234375, -1.92718505859375, -1.7862548828125, -1.64532470703125, -1.50439453125, -1.36346435546875, -1.2225341796875, -1.08160400390625, -0.940673828125, -0.79974365234375, -0.6588134765625, -0.51788330078125, -0.376953125, -0.23602294921875, -0.0950927734375, 0.04583740234375, 0.186767578125, 0.32769775390625, 0.4686279296875, 0.60955810546875, 0.75048828125, 0.89141845703125, 1.0323486328125, 1.17327880859375, 1.314208984375, 1.45513916015625, 1.5960693359375, 1.73699951171875, 1.8779296875, 2.01885986328125, 2.1597900390625, 2.30072021484375, 2.441650390625, 2.58258056640625, 2.7235107421875, 2.86444091796875, 3.00537109375, 3.14630126953125, 3.2872314453125, 3.42816162109375, 3.569091796875, 3.71002197265625, 3.8509521484375, 3.99188232421875, 4.1328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 3.0, 8.0, 13.0, 22.0, 17.0, 31.0, 27.0, 31.0, 31.0, 44.0, 44.0, 58.0, 56.0, 73.0, 62.0, 59.0, 60.0, 55.0, 45.0, 46.0, 47.0, 34.0, 34.0, 13.0, 27.0, 14.0, 13.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.49896240234375, -3.3944091796875, -3.28985595703125, -3.185302734375, -3.08074951171875, -2.9761962890625, -2.87164306640625, -2.76708984375, -2.66253662109375, -2.5579833984375, -2.45343017578125, -2.348876953125, -2.24432373046875, -2.1397705078125, -2.03521728515625, -1.9306640625, -1.82611083984375, -1.7215576171875, -1.61700439453125, -1.512451171875, -1.40789794921875, -1.3033447265625, -1.19879150390625, -1.09423828125, -0.98968505859375, -0.8851318359375, -0.78057861328125, -0.676025390625, -0.57147216796875, -0.4669189453125, -0.36236572265625, -0.2578125, -0.15325927734375, -0.0487060546875, 0.05584716796875, 0.160400390625, 0.26495361328125, 0.3695068359375, 0.47406005859375, 0.57861328125, 0.68316650390625, 0.7877197265625, 0.89227294921875, 0.996826171875, 1.10137939453125, 1.2059326171875, 1.31048583984375, 1.4150390625, 1.51959228515625, 1.6241455078125, 1.72869873046875, 1.833251953125, 1.93780517578125, 2.0423583984375, 2.14691162109375, 2.25146484375, 2.35601806640625, 2.4605712890625, 2.56512451171875, 2.669677734375, 2.77423095703125, 2.8787841796875, 2.98333740234375, 3.087890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 2.0, 7.0, 8.0, 8.0, 16.0, 22.0, 31.0, 46.0, 76.0, 106.0, 170.0, 278.0, 408.0, 696.0, 1196.0, 2337.0, 5742.0, 20876.0, 117176.0, 654661.0, 199181.0, 31414.0, 7778.0, 2837.0, 1417.0, 849.0, 430.0, 295.0, 176.0, 95.0, 84.0, 52.0, 22.0, 18.0, 10.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-11.34375, -11.0645751953125, -10.785400390625, -10.5062255859375, -10.22705078125, -9.9478759765625, -9.668701171875, -9.3895263671875, -9.1103515625, -8.8311767578125, -8.552001953125, -8.2728271484375, -7.99365234375, -7.7144775390625, -7.435302734375, -7.1561279296875, -6.876953125, -6.5977783203125, -6.318603515625, -6.0394287109375, -5.76025390625, -5.4810791015625, -5.201904296875, -4.9227294921875, -4.6435546875, -4.3643798828125, -4.085205078125, -3.8060302734375, -3.52685546875, -3.2476806640625, -2.968505859375, -2.6893310546875, -2.41015625, -2.1309814453125, -1.851806640625, -1.5726318359375, -1.29345703125, -1.0142822265625, -0.735107421875, -0.4559326171875, -0.1767578125, 0.1024169921875, 0.381591796875, 0.6607666015625, 0.93994140625, 1.2191162109375, 1.498291015625, 1.7774658203125, 2.056640625, 2.3358154296875, 2.614990234375, 2.8941650390625, 3.17333984375, 3.4525146484375, 3.731689453125, 4.0108642578125, 4.2900390625, 4.5692138671875, 4.848388671875, 5.1275634765625, 5.40673828125, 5.6859130859375, 5.965087890625, 6.2442626953125, 6.5234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 13.0, 8.0, 10.0, 13.0, 16.0, 22.0, 22.0, 18.0, 26.0, 31.0, 33.0, 46.0, 44.0, 48.0, 44.0, 43.0, 46.0, 61.0, 48.0, 50.0, 41.0, 54.0, 24.0, 31.0, 29.0, 29.0, 31.0, 15.0, 14.0, 14.0, 14.0, 16.0, 6.0, 13.0, 5.0, 1.0, 6.0, 4.0, 1.0, 5.0, 0.0, 5.0, 2.0], "bins": [-15.7265625, -15.3177490234375, -14.908935546875, -14.5001220703125, -14.09130859375, -13.6824951171875, -13.273681640625, -12.8648681640625, -12.4560546875, -12.0472412109375, -11.638427734375, -11.2296142578125, -10.82080078125, -10.4119873046875, -10.003173828125, -9.5943603515625, -9.185546875, -8.7767333984375, -8.367919921875, -7.9591064453125, -7.55029296875, -7.1414794921875, -6.732666015625, -6.3238525390625, -5.9150390625, -5.5062255859375, -5.097412109375, -4.6885986328125, -4.27978515625, -3.8709716796875, -3.462158203125, -3.0533447265625, -2.64453125, -2.2357177734375, -1.826904296875, -1.4180908203125, -1.00927734375, -0.6004638671875, -0.191650390625, 0.2171630859375, 0.6259765625, 1.0347900390625, 1.443603515625, 1.8524169921875, 2.26123046875, 2.6700439453125, 3.078857421875, 3.4876708984375, 3.896484375, 4.3052978515625, 4.714111328125, 5.1229248046875, 5.53173828125, 5.9405517578125, 6.349365234375, 6.7581787109375, 7.1669921875, 7.5758056640625, 7.984619140625, 8.3934326171875, 8.80224609375, 9.2110595703125, 9.619873046875, 10.0286865234375, 10.4375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 12.0, 11.0, 21.0, 44.0, 49.0, 112.0, 255.0, 590.0, 2068.0, 12500.0, 254487.0, 743270.0, 29970.0, 3609.0, 897.0, 313.0, 134.0, 77.0, 46.0, 28.0, 12.0, 17.0, 6.0, 8.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.7474365234375, -4.584716796875, -4.4219970703125, -4.25927734375, -4.0965576171875, -3.933837890625, -3.7711181640625, -3.6083984375, -3.4456787109375, -3.282958984375, -3.1202392578125, -2.95751953125, -2.7947998046875, -2.632080078125, -2.4693603515625, -2.306640625, -2.1439208984375, -1.981201171875, -1.8184814453125, -1.65576171875, -1.4930419921875, -1.330322265625, -1.1676025390625, -1.0048828125, -0.8421630859375, -0.679443359375, -0.5167236328125, -0.35400390625, -0.1912841796875, -0.028564453125, 0.1341552734375, 0.296875, 0.4595947265625, 0.622314453125, 0.7850341796875, 0.94775390625, 1.1104736328125, 1.273193359375, 1.4359130859375, 1.5986328125, 1.7613525390625, 1.924072265625, 2.0867919921875, 2.24951171875, 2.4122314453125, 2.574951171875, 2.7376708984375, 2.900390625, 3.0631103515625, 3.225830078125, 3.3885498046875, 3.55126953125, 3.7139892578125, 3.876708984375, 4.0394287109375, 4.2021484375, 4.3648681640625, 4.527587890625, 4.6903076171875, 4.85302734375, 5.0157470703125, 5.178466796875, 5.3411865234375, 5.50390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 16.0, 11.0, 22.0, 30.0, 36.0, 47.0, 47.0, 68.0, 79.0, 84.0, 82.0, 89.0, 65.0, 57.0, 31.0, 42.0, 41.0, 22.0, 22.0, 15.0, 12.0, 13.0, 9.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004367828369140625, -0.0004205256700515747, -0.0004042685031890869, -0.0003880113363265991, -0.00037175416946411133, -0.00035549700260162354, -0.00033923983573913574, -0.00032298266887664795, -0.00030672550201416016, -0.00029046833515167236, -0.00027421116828918457, -0.0002579540014266968, -0.00024169683456420898, -0.0002254396677017212, -0.0002091825008392334, -0.0001929253339767456, -0.0001766681671142578, -0.00016041100025177002, -0.00014415383338928223, -0.00012789666652679443, -0.00011163949966430664, -9.538233280181885e-05, -7.912516593933105e-05, -6.286799907684326e-05, -4.661083221435547e-05, -3.0353665351867676e-05, -1.4096498489379883e-05, 2.16066837310791e-06, 1.8417835235595703e-05, 3.4675002098083496e-05, 5.093216896057129e-05, 6.718933582305908e-05, 8.344650268554688e-05, 9.970366954803467e-05, 0.00011596083641052246, 0.00013221800327301025, 0.00014847517013549805, 0.00016473233699798584, 0.00018098950386047363, 0.00019724667072296143, 0.00021350383758544922, 0.000229761004447937, 0.0002460181713104248, 0.0002622753381729126, 0.0002785325050354004, 0.0002947896718978882, 0.000311046838760376, 0.00032730400562286377, 0.00034356117248535156, 0.00035981833934783936, 0.00037607550621032715, 0.00039233267307281494, 0.00040858983993530273, 0.00042484700679779053, 0.0004411041736602783, 0.0004573613405227661, 0.0004736185073852539, 0.0004898756742477417, 0.0005061328411102295, 0.0005223900079727173, 0.0005386471748352051, 0.0005549043416976929, 0.0005711615085601807, 0.0005874186754226685, 0.0006036758422851562]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 8.0, 7.0, 21.0, 48.0, 64.0, 155.0, 323.0, 879.0, 2846.0, 15471.0, 284235.0, 704982.0, 32954.0, 4526.0, 1223.0, 425.0, 165.0, 95.0, 50.0, 19.0, 20.0, 14.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.1541748046875, -5.007568359375, -4.8609619140625, -4.71435546875, -4.5677490234375, -4.421142578125, -4.2745361328125, -4.1279296875, -3.9813232421875, -3.834716796875, -3.6881103515625, -3.54150390625, -3.3948974609375, -3.248291015625, -3.1016845703125, -2.955078125, -2.8084716796875, -2.661865234375, -2.5152587890625, -2.36865234375, -2.2220458984375, -2.075439453125, -1.9288330078125, -1.7822265625, -1.6356201171875, -1.489013671875, -1.3424072265625, -1.19580078125, -1.0491943359375, -0.902587890625, -0.7559814453125, -0.609375, -0.4627685546875, -0.316162109375, -0.1695556640625, -0.02294921875, 0.1236572265625, 0.270263671875, 0.4168701171875, 0.5634765625, 0.7100830078125, 0.856689453125, 1.0032958984375, 1.14990234375, 1.2965087890625, 1.443115234375, 1.5897216796875, 1.736328125, 1.8829345703125, 2.029541015625, 2.1761474609375, 2.32275390625, 2.4693603515625, 2.615966796875, 2.7625732421875, 2.9091796875, 3.0557861328125, 3.202392578125, 3.3489990234375, 3.49560546875, 3.6422119140625, 3.788818359375, 3.9354248046875, 4.08203125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 6.0, 10.0, 6.0, 15.0, 21.0, 29.0, 28.0, 49.0, 55.0, 63.0, 59.0, 72.0, 84.0, 77.0, 78.0, 69.0, 60.0, 40.0, 43.0, 34.0, 33.0, 23.0, 9.0, 9.0, 5.0, 10.0, 8.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.888671875, -2.795196533203125, -2.70172119140625, -2.608245849609375, -2.5147705078125, -2.421295166015625, -2.32781982421875, -2.234344482421875, -2.140869140625, -2.047393798828125, -1.95391845703125, -1.860443115234375, -1.7669677734375, -1.673492431640625, -1.58001708984375, -1.486541748046875, -1.39306640625, -1.299591064453125, -1.20611572265625, -1.112640380859375, -1.0191650390625, -0.925689697265625, -0.83221435546875, -0.738739013671875, -0.645263671875, -0.551788330078125, -0.45831298828125, -0.364837646484375, -0.2713623046875, -0.177886962890625, -0.08441162109375, 0.009063720703125, 0.1025390625, 0.196014404296875, 0.28948974609375, 0.382965087890625, 0.4764404296875, 0.569915771484375, 0.66339111328125, 0.756866455078125, 0.850341796875, 0.943817138671875, 1.03729248046875, 1.130767822265625, 1.2242431640625, 1.317718505859375, 1.41119384765625, 1.504669189453125, 1.59814453125, 1.691619873046875, 1.78509521484375, 1.878570556640625, 1.9720458984375, 2.065521240234375, 2.15899658203125, 2.252471923828125, 2.345947265625, 2.439422607421875, 2.53289794921875, 2.626373291015625, 2.7198486328125, 2.813323974609375, 2.90679931640625, 3.000274658203125, 3.09375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 12.0, 22.0, 47.0, 84.0, 135.0, 199.0, 192.0, 141.0, 76.0, 35.0, 18.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.604705810546875, -59.14763641357422, -56.69056701660156, -54.233497619628906, -51.77642822265625, -49.319358825683594, -46.8622932434082, -44.40522384643555, -41.94815444946289, -39.491085052490234, -37.03401565551758, -34.57694625854492, -32.11988067626953, -29.662809371948242, -27.20574188232422, -24.748672485351562, -22.291603088378906, -19.83453369140625, -17.377464294433594, -14.92039680480957, -12.463327407836914, -10.006258010864258, -7.549189567565918, -5.092121124267578, -2.635051727294922, -0.17798280715942383, 2.279086112976074, 4.736155033111572, 7.19322395324707, 9.650293350219727, 12.107361793518066, 14.564430236816406, 17.02149200439453, 19.478561401367188, 21.935630798339844, 24.392698287963867, 26.849767684936523, 29.30683708190918, 31.763904571533203, 34.22097396850586, 36.678043365478516, 39.13511276245117, 41.59218215942383, 44.049251556396484, 46.506317138671875, 48.96338653564453, 51.42045593261719, 53.877525329589844, 56.3345947265625, 58.791664123535156, 61.24873352050781, 63.70580291748047, 66.16287231445312, 68.61994171142578, 71.07701110839844, 73.53407287597656, 75.99114990234375, 78.4482192993164, 80.90528869628906, 83.36235809326172, 85.81942749023438, 88.27649688720703, 90.73356628417969, 93.19062805175781, 95.64769744873047]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 15.0, 19.0, 21.0, 25.0, 26.0, 23.0, 32.0, 26.0, 30.0, 33.0, 39.0, 46.0, 52.0, 45.0, 55.0, 66.0, 42.0, 41.0, 39.0, 32.0, 42.0, 23.0, 30.0, 24.0, 8.0, 20.0, 17.0, 14.0, 11.0, 10.0, 10.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.37994384765625, -44.93372344970703, -43.48750686645508, -42.04128646850586, -40.595069885253906, -39.14884948730469, -37.70262908935547, -36.256412506103516, -34.8101921081543, -33.36397171020508, -31.917755126953125, -30.471534729003906, -29.02531623840332, -27.579097747802734, -26.13287925720215, -24.686660766601562, -23.240442276000977, -21.79422378540039, -20.348005294799805, -18.90178680419922, -17.45556640625, -16.009347915649414, -14.563129425048828, -13.116909980773926, -11.67069149017334, -10.224472999572754, -8.778253555297852, -7.332035064697266, -5.8858160972595215, -4.439597129821777, -2.9933786392211914, -1.547159194946289, -0.10094070434570312, 1.3452781438827515, 2.791496992111206, 4.237715721130371, 5.683934688568115, 7.130153656005859, 8.576372146606445, 10.022591590881348, 11.468810081481934, 12.91502857208252, 14.361248016357422, 15.807466506958008, 17.253684997558594, 18.699905395507812, 20.146121978759766, 21.592342376708984, 23.03856086730957, 24.484779357910156, 25.930997848510742, 27.377216339111328, 28.823436737060547, 30.269655227661133, 31.71587371826172, 33.16209411621094, 34.60831069946289, 36.05453109741211, 37.50074768066406, 38.94696807861328, 40.393184661865234, 41.83940505981445, 43.285621643066406, 44.731842041015625, 46.178062438964844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 3.0, 7.0, 6.0, 3.0, 12.0, 12.0, 18.0, 33.0, 37.0, 47.0, 78.0, 120.0, 180.0, 372.0, 962.0, 3483.0, 18902.0, 525415.0, 3582161.0, 52806.0, 6990.0, 1609.0, 488.0, 203.0, 102.0, 80.0, 41.0, 34.0, 20.0, 14.0, 13.0, 6.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.1153564453125, -8.832275390625, -8.5491943359375, -8.26611328125, -7.9830322265625, -7.699951171875, -7.4168701171875, -7.1337890625, -6.8507080078125, -6.567626953125, -6.2845458984375, -6.00146484375, -5.7183837890625, -5.435302734375, -5.1522216796875, -4.869140625, -4.5860595703125, -4.302978515625, -4.0198974609375, -3.73681640625, -3.4537353515625, -3.170654296875, -2.8875732421875, -2.6044921875, -2.3214111328125, -2.038330078125, -1.7552490234375, -1.47216796875, -1.1890869140625, -0.906005859375, -0.6229248046875, -0.33984375, -0.0567626953125, 0.226318359375, 0.5093994140625, 0.79248046875, 1.0755615234375, 1.358642578125, 1.6417236328125, 1.9248046875, 2.2078857421875, 2.490966796875, 2.7740478515625, 3.05712890625, 3.3402099609375, 3.623291015625, 3.9063720703125, 4.189453125, 4.4725341796875, 4.755615234375, 5.0386962890625, 5.32177734375, 5.6048583984375, 5.887939453125, 6.1710205078125, 6.4541015625, 6.7371826171875, 7.020263671875, 7.3033447265625, 7.58642578125, 7.8695068359375, 8.152587890625, 8.4356689453125, 8.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 15.0, 24.0, 32.0, 35.0, 56.0, 69.0, 88.0, 99.0, 101.0, 108.0, 93.0, 74.0, 59.0, 52.0, 23.0, 31.0, 14.0, 11.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.896209716796875, -6.73773193359375, -6.579254150390625, -6.4207763671875, -6.262298583984375, -6.10382080078125, -5.945343017578125, -5.786865234375, -5.628387451171875, -5.46990966796875, -5.311431884765625, -5.1529541015625, -4.994476318359375, -4.83599853515625, -4.677520751953125, -4.51904296875, -4.360565185546875, -4.20208740234375, -4.043609619140625, -3.8851318359375, -3.726654052734375, -3.56817626953125, -3.409698486328125, -3.251220703125, -3.092742919921875, -2.93426513671875, -2.775787353515625, -2.6173095703125, -2.458831787109375, -2.30035400390625, -2.141876220703125, -1.9833984375, -1.824920654296875, -1.66644287109375, -1.507965087890625, -1.3494873046875, -1.191009521484375, -1.03253173828125, -0.874053955078125, -0.715576171875, -0.557098388671875, -0.39862060546875, -0.240142822265625, -0.0816650390625, 0.076812744140625, 0.23529052734375, 0.393768310546875, 0.55224609375, 0.710723876953125, 0.86920166015625, 1.027679443359375, 1.1861572265625, 1.344635009765625, 1.50311279296875, 1.661590576171875, 1.820068359375, 1.978546142578125, 2.13702392578125, 2.295501708984375, 2.4539794921875, 2.612457275390625, 2.77093505859375, 2.929412841796875, 3.087890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 12.0, 25.0, 39.0, 60.0, 89.0, 162.0, 292.0, 617.0, 1528.0, 4463.0, 15850.0, 85045.0, 2623962.0, 1376225.0, 66378.0, 13550.0, 3683.0, 1253.0, 497.0, 260.0, 134.0, 57.0, 35.0, 22.0, 13.0, 6.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.126708984375, -7.89404296875, -7.661376953125, -7.4287109375, -7.196044921875, -6.96337890625, -6.730712890625, -6.498046875, -6.265380859375, -6.03271484375, -5.800048828125, -5.5673828125, -5.334716796875, -5.10205078125, -4.869384765625, -4.63671875, -4.404052734375, -4.17138671875, -3.938720703125, -3.7060546875, -3.473388671875, -3.24072265625, -3.008056640625, -2.775390625, -2.542724609375, -2.31005859375, -2.077392578125, -1.8447265625, -1.612060546875, -1.37939453125, -1.146728515625, -0.9140625, -0.681396484375, -0.44873046875, -0.216064453125, 0.0166015625, 0.249267578125, 0.48193359375, 0.714599609375, 0.947265625, 1.179931640625, 1.41259765625, 1.645263671875, 1.8779296875, 2.110595703125, 2.34326171875, 2.575927734375, 2.80859375, 3.041259765625, 3.27392578125, 3.506591796875, 3.7392578125, 3.971923828125, 4.20458984375, 4.437255859375, 4.669921875, 4.902587890625, 5.13525390625, 5.367919921875, 5.6005859375, 5.833251953125, 6.06591796875, 6.298583984375, 6.53125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 13.0, 13.0, 24.0, 32.0, 47.0, 86.0, 134.0, 403.0, 915.0, 1186.0, 588.0, 255.0, 128.0, 75.0, 45.0, 44.0, 19.0, 19.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.76788330078125, -9.5123291015625, -9.25677490234375, -9.001220703125, -8.74566650390625, -8.4901123046875, -8.23455810546875, -7.97900390625, -7.72344970703125, -7.4678955078125, -7.21234130859375, -6.956787109375, -6.70123291015625, -6.4456787109375, -6.19012451171875, -5.9345703125, -5.67901611328125, -5.4234619140625, -5.16790771484375, -4.912353515625, -4.65679931640625, -4.4012451171875, -4.14569091796875, -3.89013671875, -3.63458251953125, -3.3790283203125, -3.12347412109375, -2.867919921875, -2.61236572265625, -2.3568115234375, -2.10125732421875, -1.845703125, -1.59014892578125, -1.3345947265625, -1.07904052734375, -0.823486328125, -0.56793212890625, -0.3123779296875, -0.05682373046875, 0.19873046875, 0.45428466796875, 0.7098388671875, 0.96539306640625, 1.220947265625, 1.47650146484375, 1.7320556640625, 1.98760986328125, 2.2431640625, 2.49871826171875, 2.7542724609375, 3.00982666015625, 3.265380859375, 3.52093505859375, 3.7764892578125, 4.03204345703125, 4.28759765625, 4.54315185546875, 4.7987060546875, 5.05426025390625, 5.309814453125, 5.56536865234375, 5.8209228515625, 6.07647705078125, 6.33203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 17.0, 63.0, 281.0, 380.0, 177.0, 45.0, 16.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.29899597167969, -71.90971374511719, -68.52043914794922, -65.13115692138672, -61.74187469482422, -58.352596282958984, -54.96331787109375, -51.57403564453125, -48.18475341796875, -44.795475006103516, -41.406192779541016, -38.01691436767578, -34.62763214111328, -31.238353729248047, -27.84907341003418, -24.459793090820312, -21.070514678955078, -17.68123435974121, -14.291954040527344, -10.902674674987793, -7.513394355773926, -4.124114990234375, -0.7348346710205078, 2.6544456481933594, 6.043725967407227, 9.433006286621094, 12.822286605834961, 16.211566925048828, 19.600845336914062, 22.99012565612793, 26.379405975341797, 29.768686294555664, 33.15796661376953, 36.547245025634766, 39.936527252197266, 43.3258056640625, 46.715087890625, 50.104366302490234, 53.49364471435547, 56.88292694091797, 60.27220916748047, 63.6614875793457, 67.05076599121094, 70.44004821777344, 73.82933044433594, 77.21861267089844, 80.6078872680664, 83.9971694946289, 87.38644409179688, 90.77572631835938, 94.16500091552734, 97.55428314208984, 100.94356536865234, 104.33283996582031, 107.72212219238281, 111.11140441894531, 114.50068664550781, 117.88996887207031, 121.27924346923828, 124.66852569580078, 128.05780029296875, 131.44708251953125, 134.83636474609375, 138.22564697265625, 141.61492919921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 8.0, 17.0, 10.0, 18.0, 21.0, 23.0, 23.0, 25.0, 32.0, 44.0, 37.0, 35.0, 34.0, 37.0, 54.0, 45.0, 46.0, 62.0, 52.0, 51.0, 45.0, 39.0, 27.0, 32.0, 40.0, 25.0, 27.0, 22.0, 11.0, 7.0, 12.0, 9.0, 9.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.39168930053711, -22.540687561035156, -21.68968391418457, -20.838682174682617, -19.98767852783203, -19.136676788330078, -18.285675048828125, -17.434673309326172, -16.583669662475586, -15.732666969299316, -14.881664276123047, -14.030662536621094, -13.179659843444824, -12.328657150268555, -11.477655410766602, -10.626652717590332, -9.775650024414062, -8.924647331237793, -8.073644638061523, -7.22264289855957, -6.371640205383301, -5.520637512207031, -4.66963529586792, -3.8186330795288086, -2.967630386352539, -2.1166279315948486, -1.2656254768371582, -0.4146230220794678, 0.43637943267822266, 1.2873821258544922, 2.1383843421936035, 2.989386558532715, 3.8403892517089844, 4.691391944885254, 5.542394161224365, 6.393396377563477, 7.244399070739746, 8.095401763916016, 8.946403503417969, 9.797406196594238, 10.648408889770508, 11.499411582946777, 12.350414276123047, 13.201416015625, 14.05241870880127, 14.903421401977539, 15.754423141479492, 16.605426788330078, 17.45642852783203, 18.307430267333984, 19.15843391418457, 20.009435653686523, 20.86043930053711, 21.711441040039062, 22.562442779541016, 23.41344451904297, 24.264448165893555, 25.115449905395508, 25.966453552246094, 26.817455291748047, 27.66845703125, 28.519460678100586, 29.37046241760254, 30.221466064453125, 31.072467803955078]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 9.0, 6.0, 14.0, 16.0, 12.0, 23.0, 42.0, 67.0, 108.0, 177.0, 317.0, 481.0, 822.0, 1452.0, 2775.0, 5243.0, 10785.0, 23157.0, 53552.0, 129573.0, 311975.0, 295027.0, 120449.0, 49451.0, 21753.0, 10165.0, 4984.0, 2613.0, 1422.0, 817.0, 498.0, 294.0, 183.0, 109.0, 64.0, 42.0, 17.0, 24.0, 17.0, 12.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.4296875, -4.2952880859375, -4.160888671875, -4.0264892578125, -3.89208984375, -3.7576904296875, -3.623291015625, -3.4888916015625, -3.3544921875, -3.2200927734375, -3.085693359375, -2.9512939453125, -2.81689453125, -2.6824951171875, -2.548095703125, -2.4136962890625, -2.279296875, -2.1448974609375, -2.010498046875, -1.8760986328125, -1.74169921875, -1.6072998046875, -1.472900390625, -1.3385009765625, -1.2041015625, -1.0697021484375, -0.935302734375, -0.8009033203125, -0.66650390625, -0.5321044921875, -0.397705078125, -0.2633056640625, -0.12890625, 0.0054931640625, 0.139892578125, 0.2742919921875, 0.40869140625, 0.5430908203125, 0.677490234375, 0.8118896484375, 0.9462890625, 1.0806884765625, 1.215087890625, 1.3494873046875, 1.48388671875, 1.6182861328125, 1.752685546875, 1.8870849609375, 2.021484375, 2.1558837890625, 2.290283203125, 2.4246826171875, 2.55908203125, 2.6934814453125, 2.827880859375, 2.9622802734375, 3.0966796875, 3.2310791015625, 3.365478515625, 3.4998779296875, 3.63427734375, 3.7686767578125, 3.903076171875, 4.0374755859375, 4.171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 13.0, 8.0, 11.0, 11.0, 22.0, 40.0, 32.0, 46.0, 47.0, 45.0, 60.0, 64.0, 80.0, 79.0, 53.0, 66.0, 66.0, 56.0, 32.0, 37.0, 29.0, 28.0, 14.0, 20.0, 10.0, 2.0, 9.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.747772216796875, -4.63226318359375, -4.516754150390625, -4.4012451171875, -4.285736083984375, -4.17022705078125, -4.054718017578125, -3.939208984375, -3.823699951171875, -3.70819091796875, -3.592681884765625, -3.4771728515625, -3.361663818359375, -3.24615478515625, -3.130645751953125, -3.01513671875, -2.899627685546875, -2.78411865234375, -2.668609619140625, -2.5531005859375, -2.437591552734375, -2.32208251953125, -2.206573486328125, -2.091064453125, -1.975555419921875, -1.86004638671875, -1.744537353515625, -1.6290283203125, -1.513519287109375, -1.39801025390625, -1.282501220703125, -1.1669921875, -1.051483154296875, -0.93597412109375, -0.820465087890625, -0.7049560546875, -0.589447021484375, -0.47393798828125, -0.358428955078125, -0.242919921875, -0.127410888671875, -0.01190185546875, 0.103607177734375, 0.2191162109375, 0.334625244140625, 0.45013427734375, 0.565643310546875, 0.68115234375, 0.796661376953125, 0.91217041015625, 1.027679443359375, 1.1431884765625, 1.258697509765625, 1.37420654296875, 1.489715576171875, 1.605224609375, 1.720733642578125, 1.83624267578125, 1.951751708984375, 2.0672607421875, 2.182769775390625, 2.29827880859375, 2.413787841796875, 2.529296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 17.0, 12.0, 13.0, 32.0, 46.0, 66.0, 91.0, 152.0, 240.0, 389.0, 713.0, 1468.0, 3804.0, 12449.0, 57378.0, 397385.0, 489588.0, 63705.0, 13513.0, 4017.0, 1608.0, 742.0, 403.0, 237.0, 134.0, 96.0, 53.0, 42.0, 35.0, 29.0, 10.0, 16.0, 9.0, 8.0, 7.0, 5.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.461669921875, -8.18896484375, -7.916259765625, -7.6435546875, -7.370849609375, -7.09814453125, -6.825439453125, -6.552734375, -6.280029296875, -6.00732421875, -5.734619140625, -5.4619140625, -5.189208984375, -4.91650390625, -4.643798828125, -4.37109375, -4.098388671875, -3.82568359375, -3.552978515625, -3.2802734375, -3.007568359375, -2.73486328125, -2.462158203125, -2.189453125, -1.916748046875, -1.64404296875, -1.371337890625, -1.0986328125, -0.825927734375, -0.55322265625, -0.280517578125, -0.0078125, 0.264892578125, 0.53759765625, 0.810302734375, 1.0830078125, 1.355712890625, 1.62841796875, 1.901123046875, 2.173828125, 2.446533203125, 2.71923828125, 2.991943359375, 3.2646484375, 3.537353515625, 3.81005859375, 4.082763671875, 4.35546875, 4.628173828125, 4.90087890625, 5.173583984375, 5.4462890625, 5.718994140625, 5.99169921875, 6.264404296875, 6.537109375, 6.809814453125, 7.08251953125, 7.355224609375, 7.6279296875, 7.900634765625, 8.17333984375, 8.446044921875, 8.71875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 1.0, 4.0, 9.0, 11.0, 14.0, 12.0, 21.0, 20.0, 20.0, 23.0, 42.0, 35.0, 38.0, 54.0, 56.0, 43.0, 66.0, 45.0, 49.0, 44.0, 45.0, 42.0, 49.0, 33.0, 38.0, 34.0, 21.0, 14.0, 21.0, 15.0, 8.0, 14.0, 11.0, 10.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-11.09375, -10.7310791015625, -10.368408203125, -10.0057373046875, -9.64306640625, -9.2803955078125, -8.917724609375, -8.5550537109375, -8.1923828125, -7.8297119140625, -7.467041015625, -7.1043701171875, -6.74169921875, -6.3790283203125, -6.016357421875, -5.6536865234375, -5.291015625, -4.9283447265625, -4.565673828125, -4.2030029296875, -3.84033203125, -3.4776611328125, -3.114990234375, -2.7523193359375, -2.3896484375, -2.0269775390625, -1.664306640625, -1.3016357421875, -0.93896484375, -0.5762939453125, -0.213623046875, 0.1490478515625, 0.51171875, 0.8743896484375, 1.237060546875, 1.5997314453125, 1.96240234375, 2.3250732421875, 2.687744140625, 3.0504150390625, 3.4130859375, 3.7757568359375, 4.138427734375, 4.5010986328125, 4.86376953125, 5.2264404296875, 5.589111328125, 5.9517822265625, 6.314453125, 6.6771240234375, 7.039794921875, 7.4024658203125, 7.76513671875, 8.1278076171875, 8.490478515625, 8.8531494140625, 9.2158203125, 9.5784912109375, 9.941162109375, 10.3038330078125, 10.66650390625, 11.0291748046875, 11.391845703125, 11.7545166015625, 12.1171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 4.0, 1.0, 7.0, 11.0, 11.0, 16.0, 18.0, 28.0, 40.0, 84.0, 140.0, 295.0, 651.0, 1927.0, 9834.0, 155340.0, 829057.0, 44020.0, 4759.0, 1272.0, 466.0, 222.0, 136.0, 60.0, 45.0, 32.0, 20.0, 11.0, 10.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.3900146484375, -4.229248046875, -4.0684814453125, -3.90771484375, -3.7469482421875, -3.586181640625, -3.4254150390625, -3.2646484375, -3.1038818359375, -2.943115234375, -2.7823486328125, -2.62158203125, -2.4608154296875, -2.300048828125, -2.1392822265625, -1.978515625, -1.8177490234375, -1.656982421875, -1.4962158203125, -1.33544921875, -1.1746826171875, -1.013916015625, -0.8531494140625, -0.6923828125, -0.5316162109375, -0.370849609375, -0.2100830078125, -0.04931640625, 0.1114501953125, 0.272216796875, 0.4329833984375, 0.59375, 0.7545166015625, 0.915283203125, 1.0760498046875, 1.23681640625, 1.3975830078125, 1.558349609375, 1.7191162109375, 1.8798828125, 2.0406494140625, 2.201416015625, 2.3621826171875, 2.52294921875, 2.6837158203125, 2.844482421875, 3.0052490234375, 3.166015625, 3.3267822265625, 3.487548828125, 3.6483154296875, 3.80908203125, 3.9698486328125, 4.130615234375, 4.2913818359375, 4.4521484375, 4.6129150390625, 4.773681640625, 4.9344482421875, 5.09521484375, 5.2559814453125, 5.416748046875, 5.5775146484375, 5.73828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 10.0, 9.0, 12.0, 15.0, 16.0, 28.0, 32.0, 28.0, 49.0, 65.0, 74.0, 74.0, 71.0, 77.0, 81.0, 60.0, 53.0, 47.0, 38.0, 25.0, 23.0, 23.0, 9.0, 14.0, 8.0, 8.0, 11.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004949569702148438, -0.00048040226101875305, -0.00046584755182266235, -0.00045129284262657166, -0.00043673813343048096, -0.00042218342423439026, -0.00040762871503829956, -0.00039307400584220886, -0.00037851929664611816, -0.00036396458745002747, -0.00034940987825393677, -0.00033485516905784607, -0.00032030045986175537, -0.00030574575066566467, -0.000291191041469574, -0.0002766363322734833, -0.0002620816230773926, -0.0002475269138813019, -0.00023297220468521118, -0.00021841749548912048, -0.00020386278629302979, -0.0001893080770969391, -0.0001747533679008484, -0.0001601986587047577, -0.000145643949508667, -0.0001310892403125763, -0.0001165345311164856, -0.0001019798219203949, -8.74251127243042e-05, -7.28704035282135e-05, -5.83156943321228e-05, -4.3760985136032104e-05, -2.9206275939941406e-05, -1.4651566743850708e-05, -9.685754776000977e-08, 1.4457851648330688e-05, 2.9012560844421387e-05, 4.3567270040512085e-05, 5.812197923660278e-05, 7.267668843269348e-05, 8.723139762878418e-05, 0.00010178610682487488, 0.00011634081602096558, 0.00013089552521705627, 0.00014545023441314697, 0.00016000494360923767, 0.00017455965280532837, 0.00018911436200141907, 0.00020366907119750977, 0.00021822378039360046, 0.00023277848958969116, 0.00024733319878578186, 0.00026188790798187256, 0.00027644261717796326, 0.00029099732637405396, 0.00030555203557014465, 0.00032010674476623535, 0.00033466145396232605, 0.00034921616315841675, 0.00036377087235450745, 0.00037832558155059814, 0.00039288029074668884, 0.00040743499994277954, 0.00042198970913887024, 0.00043654441833496094]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 10.0, 14.0, 15.0, 23.0, 29.0, 35.0, 54.0, 77.0, 125.0, 194.0, 292.0, 490.0, 924.0, 1775.0, 4157.0, 12754.0, 59123.0, 373165.0, 500495.0, 71104.0, 14718.0, 4666.0, 1906.0, 933.0, 502.0, 317.0, 185.0, 136.0, 91.0, 69.0, 42.0, 22.0, 25.0, 16.0, 10.0, 10.0, 3.0, 7.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37890625, -2.29974365234375, -2.2205810546875, -2.14141845703125, -2.062255859375, -1.98309326171875, -1.9039306640625, -1.82476806640625, -1.74560546875, -1.66644287109375, -1.5872802734375, -1.50811767578125, -1.428955078125, -1.34979248046875, -1.2706298828125, -1.19146728515625, -1.1123046875, -1.03314208984375, -0.9539794921875, -0.87481689453125, -0.795654296875, -0.71649169921875, -0.6373291015625, -0.55816650390625, -0.47900390625, -0.39984130859375, -0.3206787109375, -0.24151611328125, -0.162353515625, -0.08319091796875, -0.0040283203125, 0.07513427734375, 0.154296875, 0.23345947265625, 0.3126220703125, 0.39178466796875, 0.470947265625, 0.55010986328125, 0.6292724609375, 0.70843505859375, 0.78759765625, 0.86676025390625, 0.9459228515625, 1.02508544921875, 1.104248046875, 1.18341064453125, 1.2625732421875, 1.34173583984375, 1.4208984375, 1.50006103515625, 1.5792236328125, 1.65838623046875, 1.737548828125, 1.81671142578125, 1.8958740234375, 1.97503662109375, 2.05419921875, 2.13336181640625, 2.2125244140625, 2.29168701171875, 2.370849609375, 2.45001220703125, 2.5291748046875, 2.60833740234375, 2.6875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 8.0, 13.0, 18.0, 31.0, 34.0, 36.0, 58.0, 67.0, 65.0, 103.0, 98.0, 86.0, 80.0, 80.0, 49.0, 35.0, 33.0, 25.0, 21.0, 14.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.927490234375, -3.82763671875, -3.727783203125, -3.6279296875, -3.528076171875, -3.42822265625, -3.328369140625, -3.228515625, -3.128662109375, -3.02880859375, -2.928955078125, -2.8291015625, -2.729248046875, -2.62939453125, -2.529541015625, -2.4296875, -2.329833984375, -2.22998046875, -2.130126953125, -2.0302734375, -1.930419921875, -1.83056640625, -1.730712890625, -1.630859375, -1.531005859375, -1.43115234375, -1.331298828125, -1.2314453125, -1.131591796875, -1.03173828125, -0.931884765625, -0.83203125, -0.732177734375, -0.63232421875, -0.532470703125, -0.4326171875, -0.332763671875, -0.23291015625, -0.133056640625, -0.033203125, 0.066650390625, 0.16650390625, 0.266357421875, 0.3662109375, 0.466064453125, 0.56591796875, 0.665771484375, 0.765625, 0.865478515625, 0.96533203125, 1.065185546875, 1.1650390625, 1.264892578125, 1.36474609375, 1.464599609375, 1.564453125, 1.664306640625, 1.76416015625, 1.864013671875, 1.9638671875, 2.063720703125, 2.16357421875, 2.263427734375, 2.36328125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 15.0, 16.0, 43.0, 90.0, 176.0, 238.0, 200.0, 113.0, 49.0, 31.0, 13.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-88.62583923339844, -86.14532470703125, -83.66480255126953, -81.18428802490234, -78.70377349853516, -76.22325134277344, -73.74273681640625, -71.26222229003906, -68.78170013427734, -66.30118560791016, -63.8206672668457, -61.34014892578125, -58.8596305847168, -56.379112243652344, -53.898597717285156, -51.4180793762207, -48.937564849853516, -46.45704650878906, -43.976531982421875, -41.49601364135742, -39.01549530029297, -36.53498077392578, -34.05446243286133, -31.573944091796875, -29.093427658081055, -26.612911224365234, -24.13239288330078, -21.65187644958496, -19.17136001586914, -16.690841674804688, -14.210325241088867, -11.729806900024414, -9.249290466308594, -6.768773078918457, -4.2882561683654785, -1.8077392578125, 0.6727781295776367, 3.1532955169677734, 5.633811950683594, 8.114330291748047, 10.594846725463867, 13.075364112854004, 15.55588150024414, 18.03639793395996, 20.51691436767578, 22.997432708740234, 25.477949142456055, 27.958467483520508, 30.438983917236328, 32.91950225830078, 35.40001678466797, 37.88053512573242, 40.361053466796875, 42.84156799316406, 45.322086334228516, 47.80260467529297, 50.283119201660156, 52.76363754272461, 55.2441520690918, 57.72467041015625, 60.2051887512207, 62.685707092285156, 65.16622161865234, 67.64674377441406, 70.12725830078125]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 9.0, 14.0, 8.0, 16.0, 23.0, 31.0, 32.0, 29.0, 45.0, 41.0, 64.0, 79.0, 90.0, 81.0, 85.0, 62.0, 51.0, 60.0, 51.0, 35.0, 26.0, 18.0, 12.0, 12.0, 9.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-79.71756744384766, -77.67255401611328, -75.6275405883789, -73.58252716064453, -71.53751373291016, -69.49250030517578, -67.4474868774414, -65.4024658203125, -63.35745620727539, -61.312442779541016, -59.26742935180664, -57.222415924072266, -55.177398681640625, -53.13238525390625, -51.087371826171875, -49.0423583984375, -46.997344970703125, -44.95233154296875, -42.907318115234375, -40.8623046875, -38.817291259765625, -36.77227783203125, -34.72726058959961, -32.682247161865234, -30.63723373413086, -28.592220306396484, -26.54720687866211, -24.5021915435791, -22.457178115844727, -20.41216468811035, -18.367149353027344, -16.32213592529297, -14.277130126953125, -12.23211669921875, -10.187102317810059, -8.142087936401367, -6.097074508666992, -4.052061080932617, -2.007046699523926, 0.037967681884765625, 2.0829811096191406, 4.127995014190674, 6.173008918762207, 8.218023300170898, 10.263036727905273, 12.308050155639648, 14.35306453704834, 16.39807891845703, 18.443092346191406, 20.48810577392578, 22.533119201660156, 24.578134536743164, 26.62314796447754, 28.668161392211914, 30.713176727294922, 32.7581901550293, 34.80320358276367, 36.84821701049805, 38.89323043823242, 40.9382438659668, 42.98326110839844, 45.02827453613281, 47.07328796386719, 49.11830139160156, 51.16331481933594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 3.0, 10.0, 11.0, 10.0, 16.0, 33.0, 71.0, 108.0, 238.0, 769.0, 2658.0, 11199.0, 93501.0, 2808926.0, 1214785.0, 49895.0, 8456.0, 2391.0, 788.0, 263.0, 80.0, 26.0, 17.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.448974609375, -7.25732421875, -7.065673828125, -6.8740234375, -6.682373046875, -6.49072265625, -6.299072265625, -6.107421875, -5.915771484375, -5.72412109375, -5.532470703125, -5.3408203125, -5.149169921875, -4.95751953125, -4.765869140625, -4.57421875, -4.382568359375, -4.19091796875, -3.999267578125, -3.8076171875, -3.615966796875, -3.42431640625, -3.232666015625, -3.041015625, -2.849365234375, -2.65771484375, -2.466064453125, -2.2744140625, -2.082763671875, -1.89111328125, -1.699462890625, -1.5078125, -1.316162109375, -1.12451171875, -0.932861328125, -0.7412109375, -0.549560546875, -0.35791015625, -0.166259765625, 0.025390625, 0.217041015625, 0.40869140625, 0.600341796875, 0.7919921875, 0.983642578125, 1.17529296875, 1.366943359375, 1.55859375, 1.750244140625, 1.94189453125, 2.133544921875, 2.3251953125, 2.516845703125, 2.70849609375, 2.900146484375, 3.091796875, 3.283447265625, 3.47509765625, 3.666748046875, 3.8583984375, 4.050048828125, 4.24169921875, 4.433349609375, 4.625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 14.0, 20.0, 26.0, 50.0, 66.0, 86.0, 99.0, 119.0, 93.0, 110.0, 85.0, 80.0, 56.0, 47.0, 23.0, 15.0, 11.0, 4.0, 4.0, 1.0], "bins": [-9.0, -8.827606201171875, -8.65521240234375, -8.482818603515625, -8.3104248046875, -8.138031005859375, -7.96563720703125, -7.793243408203125, -7.620849609375, -7.448455810546875, -7.27606201171875, -7.103668212890625, -6.9312744140625, -6.758880615234375, -6.58648681640625, -6.414093017578125, -6.24169921875, -6.069305419921875, -5.89691162109375, -5.724517822265625, -5.5521240234375, -5.379730224609375, -5.20733642578125, -5.034942626953125, -4.862548828125, -4.690155029296875, -4.51776123046875, -4.345367431640625, -4.1729736328125, -4.000579833984375, -3.82818603515625, -3.655792236328125, -3.4833984375, -3.311004638671875, -3.13861083984375, -2.966217041015625, -2.7938232421875, -2.621429443359375, -2.44903564453125, -2.276641845703125, -2.104248046875, -1.931854248046875, -1.75946044921875, -1.587066650390625, -1.4146728515625, -1.242279052734375, -1.06988525390625, -0.897491455078125, -0.72509765625, -0.552703857421875, -0.38031005859375, -0.207916259765625, -0.0355224609375, 0.136871337890625, 0.30926513671875, 0.481658935546875, 0.654052734375, 0.826446533203125, 0.99884033203125, 1.171234130859375, 1.3436279296875, 1.516021728515625, 1.68841552734375, 1.860809326171875, 2.033203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 4.0, 4.0, 4.0, 9.0, 5.0, 19.0, 20.0, 43.0, 44.0, 83.0, 130.0, 280.0, 442.0, 974.0, 2000.0, 5491.0, 18611.0, 94008.0, 1909949.0, 2042175.0, 95746.0, 16935.0, 4397.0, 1554.0, 591.0, 323.0, 168.0, 111.0, 63.0, 32.0, 27.0, 19.0, 10.0, 1.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69140625, -7.48358154296875, -7.2757568359375, -7.06793212890625, -6.860107421875, -6.65228271484375, -6.4444580078125, -6.23663330078125, -6.02880859375, -5.82098388671875, -5.6131591796875, -5.40533447265625, -5.197509765625, -4.98968505859375, -4.7818603515625, -4.57403564453125, -4.3662109375, -4.15838623046875, -3.9505615234375, -3.74273681640625, -3.534912109375, -3.32708740234375, -3.1192626953125, -2.91143798828125, -2.70361328125, -2.49578857421875, -2.2879638671875, -2.08013916015625, -1.872314453125, -1.66448974609375, -1.4566650390625, -1.24884033203125, -1.041015625, -0.83319091796875, -0.6253662109375, -0.41754150390625, -0.209716796875, -0.00189208984375, 0.2059326171875, 0.41375732421875, 0.62158203125, 0.82940673828125, 1.0372314453125, 1.24505615234375, 1.452880859375, 1.66070556640625, 1.8685302734375, 2.07635498046875, 2.2841796875, 2.49200439453125, 2.6998291015625, 2.90765380859375, 3.115478515625, 3.32330322265625, 3.5311279296875, 3.73895263671875, 3.94677734375, 4.15460205078125, 4.3624267578125, 4.57025146484375, 4.778076171875, 4.98590087890625, 5.1937255859375, 5.40155029296875, 5.609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 7.0, 5.0, 3.0, 10.0, 9.0, 17.0, 20.0, 29.0, 51.0, 59.0, 110.0, 187.0, 303.0, 697.0, 1007.0, 711.0, 319.0, 196.0, 115.0, 70.0, 47.0, 32.0, 19.0, 17.0, 7.0, 7.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.78125, -10.521728515625, -10.26220703125, -10.002685546875, -9.7431640625, -9.483642578125, -9.22412109375, -8.964599609375, -8.705078125, -8.445556640625, -8.18603515625, -7.926513671875, -7.6669921875, -7.407470703125, -7.14794921875, -6.888427734375, -6.62890625, -6.369384765625, -6.10986328125, -5.850341796875, -5.5908203125, -5.331298828125, -5.07177734375, -4.812255859375, -4.552734375, -4.293212890625, -4.03369140625, -3.774169921875, -3.5146484375, -3.255126953125, -2.99560546875, -2.736083984375, -2.4765625, -2.217041015625, -1.95751953125, -1.697998046875, -1.4384765625, -1.178955078125, -0.91943359375, -0.659912109375, -0.400390625, -0.140869140625, 0.11865234375, 0.378173828125, 0.6376953125, 0.897216796875, 1.15673828125, 1.416259765625, 1.67578125, 1.935302734375, 2.19482421875, 2.454345703125, 2.7138671875, 2.973388671875, 3.23291015625, 3.492431640625, 3.751953125, 4.011474609375, 4.27099609375, 4.530517578125, 4.7900390625, 5.049560546875, 5.30908203125, 5.568603515625, 5.828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 23.0, 41.0, 107.0, 212.0, 224.0, 186.0, 95.0, 44.0, 22.0, 12.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.46714401245117, -52.03287124633789, -49.598602294921875, -47.164329528808594, -44.73005676269531, -42.29578399658203, -39.86151123046875, -37.427242279052734, -34.99296951293945, -32.55869674682617, -30.124425888061523, -27.690155029296875, -25.255882263183594, -22.821609497070312, -20.387338638305664, -17.953067779541016, -15.518795013427734, -13.08452320098877, -10.650251388549805, -8.21597957611084, -5.781707763671875, -3.34743595123291, -0.9131641387939453, 1.5211067199707031, 3.9553794860839844, 6.389651298522949, 8.823923110961914, 11.258194923400879, 13.692466735839844, 16.126739501953125, 18.561010360717773, 20.995281219482422, 23.429550170898438, 25.86382293701172, 28.298093795776367, 30.732364654541016, 33.1666374206543, 35.60091018676758, 38.035179138183594, 40.469451904296875, 42.903724670410156, 45.33799743652344, 47.77227020263672, 50.206539154052734, 52.640811920166016, 55.0750846862793, 57.50935363769531, 59.943626403808594, 62.377899169921875, 64.81217193603516, 67.24644470214844, 69.68071746826172, 72.114990234375, 74.54925537109375, 76.98352813720703, 79.41780090332031, 81.8520736694336, 84.28634643554688, 86.72061920166016, 89.15489196777344, 91.58915710449219, 94.02342987060547, 96.45770263671875, 98.89197540283203, 101.32624816894531]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 8.0, 12.0, 11.0, 10.0, 21.0, 27.0, 40.0, 32.0, 49.0, 65.0, 65.0, 66.0, 52.0, 63.0, 63.0, 54.0, 56.0, 53.0, 50.0, 54.0, 30.0, 28.0, 23.0, 16.0, 19.0, 10.0, 3.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.337627410888672, -22.94782829284668, -21.558029174804688, -20.168228149414062, -18.77842903137207, -17.388629913330078, -15.99882984161377, -14.609029769897461, -13.219230651855469, -11.829431533813477, -10.439631462097168, -9.04983139038086, -7.660032272338867, -6.270232677459717, -4.880433082580566, -3.490633010864258, -2.1008338928222656, -0.7110342979431152, 0.6787652969360352, 2.0685648918151855, 3.458364486694336, 4.848164081573486, 6.237963676452637, 7.627763748168945, 9.017562866210938, 10.40736198425293, 11.797162055969238, 13.186962127685547, 14.576761245727539, 15.966560363769531, 17.356361389160156, 18.74616050720215, 20.135955810546875, 21.525754928588867, 22.91555404663086, 24.305355072021484, 25.695154190063477, 27.08495330810547, 28.474754333496094, 29.864553451538086, 31.254352569580078, 32.6441535949707, 34.03395080566406, 35.42375183105469, 36.81355285644531, 38.20335006713867, 39.5931510925293, 40.982948303222656, 42.37274932861328, 43.762550354003906, 45.152347564697266, 46.54214859008789, 47.93194580078125, 49.321746826171875, 50.7115478515625, 52.101348876953125, 53.491146087646484, 54.88094711303711, 56.27074432373047, 57.660545349121094, 59.05034637451172, 60.44014358520508, 61.8299446105957, 63.21974182128906, 64.60954284667969]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 9.0, 15.0, 25.0, 37.0, 67.0, 98.0, 152.0, 255.0, 427.0, 893.0, 1796.0, 3879.0, 8885.0, 20418.0, 49583.0, 115667.0, 249243.0, 307357.0, 164525.0, 71653.0, 30142.0, 12834.0, 5450.0, 2504.0, 1197.0, 587.0, 345.0, 188.0, 123.0, 74.0, 36.0, 27.0, 16.0, 17.0, 10.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.102264404296875, -3.98577880859375, -3.869293212890625, -3.7528076171875, -3.636322021484375, -3.51983642578125, -3.403350830078125, -3.286865234375, -3.170379638671875, -3.05389404296875, -2.937408447265625, -2.8209228515625, -2.704437255859375, -2.58795166015625, -2.471466064453125, -2.35498046875, -2.238494873046875, -2.12200927734375, -2.005523681640625, -1.8890380859375, -1.772552490234375, -1.65606689453125, -1.539581298828125, -1.423095703125, -1.306610107421875, -1.19012451171875, -1.073638916015625, -0.9571533203125, -0.840667724609375, -0.72418212890625, -0.607696533203125, -0.4912109375, -0.374725341796875, -0.25823974609375, -0.141754150390625, -0.0252685546875, 0.091217041015625, 0.20770263671875, 0.324188232421875, 0.440673828125, 0.557159423828125, 0.67364501953125, 0.790130615234375, 0.9066162109375, 1.023101806640625, 1.13958740234375, 1.256072998046875, 1.37255859375, 1.489044189453125, 1.60552978515625, 1.722015380859375, 1.8385009765625, 1.954986572265625, 2.07147216796875, 2.187957763671875, 2.304443359375, 2.420928955078125, 2.53741455078125, 2.653900146484375, 2.7703857421875, 2.886871337890625, 3.00335693359375, 3.119842529296875, 3.236328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 8.0, 6.0, 15.0, 15.0, 18.0, 25.0, 32.0, 33.0, 28.0, 32.0, 31.0, 33.0, 49.0, 53.0, 57.0, 40.0, 46.0, 40.0, 52.0, 59.0, 35.0, 31.0, 48.0, 32.0, 31.0, 27.0, 21.0, 17.0, 14.0, 15.0, 6.0, 10.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.7578125, -2.683013916015625, -2.60821533203125, -2.533416748046875, -2.4586181640625, -2.383819580078125, -2.30902099609375, -2.234222412109375, -2.159423828125, -2.084625244140625, -2.00982666015625, -1.935028076171875, -1.8602294921875, -1.785430908203125, -1.71063232421875, -1.635833740234375, -1.56103515625, -1.486236572265625, -1.41143798828125, -1.336639404296875, -1.2618408203125, -1.187042236328125, -1.11224365234375, -1.037445068359375, -0.962646484375, -0.887847900390625, -0.81304931640625, -0.738250732421875, -0.6634521484375, -0.588653564453125, -0.51385498046875, -0.439056396484375, -0.3642578125, -0.289459228515625, -0.21466064453125, -0.139862060546875, -0.0650634765625, 0.009735107421875, 0.08453369140625, 0.159332275390625, 0.234130859375, 0.308929443359375, 0.38372802734375, 0.458526611328125, 0.5333251953125, 0.608123779296875, 0.68292236328125, 0.757720947265625, 0.83251953125, 0.907318115234375, 0.98211669921875, 1.056915283203125, 1.1317138671875, 1.206512451171875, 1.28131103515625, 1.356109619140625, 1.430908203125, 1.505706787109375, 1.58050537109375, 1.655303955078125, 1.7301025390625, 1.804901123046875, 1.87969970703125, 1.954498291015625, 2.029296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 13.0, 9.0, 19.0, 24.0, 34.0, 33.0, 62.0, 98.0, 140.0, 215.0, 304.0, 467.0, 838.0, 1613.0, 3669.0, 12913.0, 96128.0, 735207.0, 168263.0, 19238.0, 4725.0, 1892.0, 962.0, 565.0, 336.0, 245.0, 167.0, 113.0, 80.0, 51.0, 36.0, 28.0, 14.0, 11.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.84765625, -7.57342529296875, -7.2991943359375, -7.02496337890625, -6.750732421875, -6.47650146484375, -6.2022705078125, -5.92803955078125, -5.65380859375, -5.37957763671875, -5.1053466796875, -4.83111572265625, -4.556884765625, -4.28265380859375, -4.0084228515625, -3.73419189453125, -3.4599609375, -3.18572998046875, -2.9114990234375, -2.63726806640625, -2.363037109375, -2.08880615234375, -1.8145751953125, -1.54034423828125, -1.26611328125, -0.99188232421875, -0.7176513671875, -0.44342041015625, -0.169189453125, 0.10504150390625, 0.3792724609375, 0.65350341796875, 0.927734375, 1.20196533203125, 1.4761962890625, 1.75042724609375, 2.024658203125, 2.29888916015625, 2.5731201171875, 2.84735107421875, 3.12158203125, 3.39581298828125, 3.6700439453125, 3.94427490234375, 4.218505859375, 4.49273681640625, 4.7669677734375, 5.04119873046875, 5.3154296875, 5.58966064453125, 5.8638916015625, 6.13812255859375, 6.412353515625, 6.68658447265625, 6.9608154296875, 7.23504638671875, 7.50927734375, 7.78350830078125, 8.0577392578125, 8.33197021484375, 8.606201171875, 8.88043212890625, 9.1546630859375, 9.42889404296875, 9.703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 9.0, 13.0, 12.0, 25.0, 19.0, 35.0, 43.0, 46.0, 77.0, 60.0, 73.0, 58.0, 79.0, 64.0, 74.0, 61.0, 57.0, 46.0, 34.0, 20.0, 28.0, 14.0, 14.0, 17.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.5648193359375, -11.106201171875, -10.6475830078125, -10.18896484375, -9.7303466796875, -9.271728515625, -8.8131103515625, -8.3544921875, -7.8958740234375, -7.437255859375, -6.9786376953125, -6.52001953125, -6.0614013671875, -5.602783203125, -5.1441650390625, -4.685546875, -4.2269287109375, -3.768310546875, -3.3096923828125, -2.85107421875, -2.3924560546875, -1.933837890625, -1.4752197265625, -1.0166015625, -0.5579833984375, -0.099365234375, 0.3592529296875, 0.81787109375, 1.2764892578125, 1.735107421875, 2.1937255859375, 2.65234375, 3.1109619140625, 3.569580078125, 4.0281982421875, 4.48681640625, 4.9454345703125, 5.404052734375, 5.8626708984375, 6.3212890625, 6.7799072265625, 7.238525390625, 7.6971435546875, 8.15576171875, 8.6143798828125, 9.072998046875, 9.5316162109375, 9.990234375, 10.4488525390625, 10.907470703125, 11.3660888671875, 11.82470703125, 12.2833251953125, 12.741943359375, 13.2005615234375, 13.6591796875, 14.1177978515625, 14.576416015625, 15.0350341796875, 15.49365234375, 15.9522705078125, 16.410888671875, 16.8695068359375, 17.328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 6.0, 3.0, 9.0, 19.0, 28.0, 42.0, 79.0, 169.0, 397.0, 1063.0, 4706.0, 51401.0, 887357.0, 94378.0, 6709.0, 1352.0, 438.0, 196.0, 93.0, 37.0, 25.0, 21.0, 15.0, 8.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.53515625, -4.400146484375, -4.26513671875, -4.130126953125, -3.9951171875, -3.860107421875, -3.72509765625, -3.590087890625, -3.455078125, -3.320068359375, -3.18505859375, -3.050048828125, -2.9150390625, -2.780029296875, -2.64501953125, -2.510009765625, -2.375, -2.239990234375, -2.10498046875, -1.969970703125, -1.8349609375, -1.699951171875, -1.56494140625, -1.429931640625, -1.294921875, -1.159912109375, -1.02490234375, -0.889892578125, -0.7548828125, -0.619873046875, -0.48486328125, -0.349853515625, -0.21484375, -0.079833984375, 0.05517578125, 0.190185546875, 0.3251953125, 0.460205078125, 0.59521484375, 0.730224609375, 0.865234375, 1.000244140625, 1.13525390625, 1.270263671875, 1.4052734375, 1.540283203125, 1.67529296875, 1.810302734375, 1.9453125, 2.080322265625, 2.21533203125, 2.350341796875, 2.4853515625, 2.620361328125, 2.75537109375, 2.890380859375, 3.025390625, 3.160400390625, 3.29541015625, 3.430419921875, 3.5654296875, 3.700439453125, 3.83544921875, 3.970458984375, 4.10546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 11.0, 11.0, 11.0, 21.0, 17.0, 25.0, 22.0, 27.0, 48.0, 65.0, 75.0, 92.0, 92.0, 95.0, 76.0, 71.0, 45.0, 43.0, 33.0, 30.0, 17.0, 18.0, 8.0, 8.0, 7.0, 6.0, 2.0, 9.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004858970642089844, -0.0004694536328315735, -0.0004530102014541626, -0.0004365667700767517, -0.0004201233386993408, -0.00040367990732192993, -0.00038723647594451904, -0.00037079304456710815, -0.00035434961318969727, -0.0003379061818122864, -0.0003214627504348755, -0.0003050193190574646, -0.0002885758876800537, -0.0002721324563026428, -0.00025568902492523193, -0.00023924559354782104, -0.00022280216217041016, -0.00020635873079299927, -0.00018991529941558838, -0.0001734718680381775, -0.0001570284366607666, -0.0001405850052833557, -0.00012414157390594482, -0.00010769814252853394, -9.125471115112305e-05, -7.481127977371216e-05, -5.836784839630127e-05, -4.192441701889038e-05, -2.5480985641479492e-05, -9.037554264068604e-06, 7.405877113342285e-06, 2.3849308490753174e-05, 4.029273986816406e-05, 5.673617124557495e-05, 7.317960262298584e-05, 8.962303400039673e-05, 0.00010606646537780762, 0.0001225098967552185, 0.0001389533281326294, 0.00015539675951004028, 0.00017184019088745117, 0.00018828362226486206, 0.00020472705364227295, 0.00022117048501968384, 0.00023761391639709473, 0.0002540573477745056, 0.0002705007791519165, 0.0002869442105293274, 0.0003033876419067383, 0.00031983107328414917, 0.00033627450466156006, 0.00035271793603897095, 0.00036916136741638184, 0.0003856047987937927, 0.0004020482301712036, 0.0004184916615486145, 0.0004349350929260254, 0.0004513785243034363, 0.00046782195568084717, 0.00048426538705825806, 0.0005007088184356689, 0.0005171522498130798, 0.0005335956811904907, 0.0005500391125679016, 0.0005664825439453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 9.0, 14.0, 24.0, 26.0, 48.0, 81.0, 109.0, 163.0, 296.0, 486.0, 1026.0, 2368.0, 6404.0, 27467.0, 233250.0, 690413.0, 67493.0, 12075.0, 3652.0, 1434.0, 668.0, 369.0, 230.0, 139.0, 101.0, 74.0, 29.0, 24.0, 21.0, 11.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.4375, -2.36187744140625, -2.2862548828125, -2.21063232421875, -2.135009765625, -2.05938720703125, -1.9837646484375, -1.90814208984375, -1.83251953125, -1.75689697265625, -1.6812744140625, -1.60565185546875, -1.530029296875, -1.45440673828125, -1.3787841796875, -1.30316162109375, -1.2275390625, -1.15191650390625, -1.0762939453125, -1.00067138671875, -0.925048828125, -0.84942626953125, -0.7738037109375, -0.69818115234375, -0.62255859375, -0.54693603515625, -0.4713134765625, -0.39569091796875, -0.320068359375, -0.24444580078125, -0.1688232421875, -0.09320068359375, -0.017578125, 0.05804443359375, 0.1336669921875, 0.20928955078125, 0.284912109375, 0.36053466796875, 0.4361572265625, 0.51177978515625, 0.58740234375, 0.66302490234375, 0.7386474609375, 0.81427001953125, 0.889892578125, 0.96551513671875, 1.0411376953125, 1.11676025390625, 1.1923828125, 1.26800537109375, 1.3436279296875, 1.41925048828125, 1.494873046875, 1.57049560546875, 1.6461181640625, 1.72174072265625, 1.79736328125, 1.87298583984375, 1.9486083984375, 2.02423095703125, 2.099853515625, 2.17547607421875, 2.2510986328125, 2.32672119140625, 2.40234375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 7.0, 7.0, 7.0, 7.0, 12.0, 19.0, 20.0, 29.0, 38.0, 31.0, 59.0, 53.0, 70.0, 92.0, 84.0, 87.0, 71.0, 60.0, 44.0, 37.0, 31.0, 27.0, 20.0, 15.0, 17.0, 12.0, 8.0, 9.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.3515625, -2.286773681640625, -2.22198486328125, -2.157196044921875, -2.0924072265625, -2.027618408203125, -1.96282958984375, -1.898040771484375, -1.833251953125, -1.768463134765625, -1.70367431640625, -1.638885498046875, -1.5740966796875, -1.509307861328125, -1.44451904296875, -1.379730224609375, -1.31494140625, -1.250152587890625, -1.18536376953125, -1.120574951171875, -1.0557861328125, -0.990997314453125, -0.92620849609375, -0.861419677734375, -0.796630859375, -0.731842041015625, -0.66705322265625, -0.602264404296875, -0.5374755859375, -0.472686767578125, -0.40789794921875, -0.343109130859375, -0.2783203125, -0.213531494140625, -0.14874267578125, -0.083953857421875, -0.0191650390625, 0.045623779296875, 0.11041259765625, 0.175201416015625, 0.239990234375, 0.304779052734375, 0.36956787109375, 0.434356689453125, 0.4991455078125, 0.563934326171875, 0.62872314453125, 0.693511962890625, 0.75830078125, 0.823089599609375, 0.88787841796875, 0.952667236328125, 1.0174560546875, 1.082244873046875, 1.14703369140625, 1.211822509765625, 1.276611328125, 1.341400146484375, 1.40618896484375, 1.470977783203125, 1.5357666015625, 1.600555419921875, 1.66534423828125, 1.730133056640625, 1.794921875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 6.0, 11.0, 26.0, 55.0, 83.0, 135.0, 241.0, 175.0, 108.0, 71.0, 37.0, 25.0, 13.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.515403747558594, -47.71651077270508, -45.91761779785156, -44.11872100830078, -42.319828033447266, -40.52093505859375, -38.722042083740234, -36.92314910888672, -35.12425231933594, -33.32535934448242, -31.526464462280273, -29.727571487426758, -27.92867660522461, -26.129783630371094, -24.330890655517578, -22.53199577331543, -20.733102798461914, -18.9342098236084, -17.13531494140625, -15.336421966552734, -13.537527084350586, -11.73863410949707, -9.939740180969238, -8.140846252441406, -6.341952323913574, -4.543058395385742, -2.7441647052764893, -0.9452710151672363, 0.8536229133605957, 2.6525163650512695, 4.451410293579102, 6.250304222106934, 8.049198150634766, 9.848092079162598, 11.64698600769043, 13.445878982543945, 15.244773864746094, 17.04366683959961, 18.842559814453125, 20.641454696655273, 22.440349578857422, 24.239242553710938, 26.038137435913086, 27.8370304107666, 29.63592529296875, 31.434818267822266, 33.23371124267578, 35.03260803222656, 36.83149719238281, 38.63039016723633, 40.429283142089844, 42.228179931640625, 44.02707290649414, 45.825965881347656, 47.62485885620117, 49.42375183105469, 51.22264862060547, 53.021541595458984, 54.8204345703125, 56.61933135986328, 58.4182243347168, 60.21711730957031, 62.01601028442383, 63.814903259277344, 65.61380004882812]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 7.0, 10.0, 14.0, 9.0, 20.0, 18.0, 18.0, 18.0, 23.0, 27.0, 36.0, 24.0, 39.0, 47.0, 58.0, 71.0, 76.0, 77.0, 54.0, 48.0, 38.0, 39.0, 30.0, 37.0, 26.0, 16.0, 17.0, 15.0, 18.0, 13.0, 9.0, 9.0, 6.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.38645935058594, -34.184654235839844, -32.982845306396484, -31.78104019165039, -30.579235076904297, -29.37742805480957, -28.175621032714844, -26.97381591796875, -25.772008895874023, -24.570201873779297, -23.368396759033203, -22.166589736938477, -20.96478271484375, -19.762977600097656, -18.56117057800293, -17.359363555908203, -16.15755844116211, -14.9557523727417, -13.753946304321289, -12.552139282226562, -11.350333213806152, -10.148527145385742, -8.946720123291016, -7.7449140548706055, -6.543107986450195, -5.341301918029785, -4.139495372772217, -2.9376890659332275, -1.7358827590942383, -0.5340766906738281, 0.6677298545837402, 1.8695363998413086, 3.0713424682617188, 4.273148536682129, 5.474955081939697, 6.676761627197266, 7.878567695617676, 9.080373764038086, 10.282180786132812, 11.483986854553223, 12.685792922973633, 13.887598991394043, 15.089405059814453, 16.29121208190918, 17.493019104003906, 18.69482421875, 19.896631240844727, 21.098438262939453, 22.300243377685547, 23.502050399780273, 24.703855514526367, 25.905662536621094, 27.107467651367188, 28.309274673461914, 29.51108169555664, 30.712886810302734, 31.91469383239746, 33.11650085449219, 34.31830596923828, 35.520111083984375, 36.721920013427734, 37.92372512817383, 39.12553024291992, 40.32733917236328, 41.529144287109375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 7.0, 17.0, 26.0, 26.0, 32.0, 51.0, 73.0, 127.0, 187.0, 334.0, 541.0, 958.0, 1804.0, 3450.0, 6995.0, 14549.0, 34507.0, 96531.0, 324965.0, 1147290.0, 1697423.0, 597470.0, 168106.0, 56030.0, 22292.0, 10041.0, 4768.0, 2518.0, 1323.0, 761.0, 384.0, 268.0, 136.0, 85.0, 52.0, 44.0, 26.0, 18.0, 16.0, 8.0, 11.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.8603668212890625, -1.800811767578125, -1.7412567138671875, -1.68170166015625, -1.6221466064453125, -1.562591552734375, -1.5030364990234375, -1.4434814453125, -1.3839263916015625, -1.324371337890625, -1.2648162841796875, -1.20526123046875, -1.1457061767578125, -1.086151123046875, -1.0265960693359375, -0.967041015625, -0.9074859619140625, -0.847930908203125, -0.7883758544921875, -0.72882080078125, -0.6692657470703125, -0.609710693359375, -0.5501556396484375, -0.4906005859375, -0.4310455322265625, -0.371490478515625, -0.3119354248046875, -0.25238037109375, -0.1928253173828125, -0.133270263671875, -0.0737152099609375, -0.01416015625, 0.0453948974609375, 0.104949951171875, 0.1645050048828125, 0.22406005859375, 0.2836151123046875, 0.343170166015625, 0.4027252197265625, 0.4622802734375, 0.5218353271484375, 0.581390380859375, 0.6409454345703125, 0.70050048828125, 0.7600555419921875, 0.819610595703125, 0.8791656494140625, 0.938720703125, 0.9982757568359375, 1.057830810546875, 1.1173858642578125, 1.17694091796875, 1.2364959716796875, 1.296051025390625, 1.3556060791015625, 1.4151611328125, 1.4747161865234375, 1.534271240234375, 1.5938262939453125, 1.65338134765625, 1.7129364013671875, 1.772491455078125, 1.8320465087890625, 1.8916015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 8.0, 6.0, 7.0, 5.0, 11.0, 11.0, 18.0, 20.0, 26.0, 33.0, 30.0, 44.0, 42.0, 36.0, 33.0, 49.0, 48.0, 50.0, 55.0, 45.0, 59.0, 41.0, 41.0, 34.0, 38.0, 34.0, 26.0, 29.0, 26.0, 23.0, 13.0, 15.0, 9.0, 9.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.451385498046875, -2.37738037109375, -2.303375244140625, -2.2293701171875, -2.155364990234375, -2.08135986328125, -2.007354736328125, -1.933349609375, -1.859344482421875, -1.78533935546875, -1.711334228515625, -1.6373291015625, -1.563323974609375, -1.48931884765625, -1.415313720703125, -1.34130859375, -1.267303466796875, -1.19329833984375, -1.119293212890625, -1.0452880859375, -0.971282958984375, -0.89727783203125, -0.823272705078125, -0.749267578125, -0.675262451171875, -0.60125732421875, -0.527252197265625, -0.4532470703125, -0.379241943359375, -0.30523681640625, -0.231231689453125, -0.1572265625, -0.083221435546875, -0.00921630859375, 0.064788818359375, 0.1387939453125, 0.212799072265625, 0.28680419921875, 0.360809326171875, 0.434814453125, 0.508819580078125, 0.58282470703125, 0.656829833984375, 0.7308349609375, 0.804840087890625, 0.87884521484375, 0.952850341796875, 1.02685546875, 1.100860595703125, 1.17486572265625, 1.248870849609375, 1.3228759765625, 1.396881103515625, 1.47088623046875, 1.544891357421875, 1.618896484375, 1.692901611328125, 1.76690673828125, 1.840911865234375, 1.9149169921875, 1.988922119140625, 2.06292724609375, 2.136932373046875, 2.2109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 8.0, 2.0, 7.0, 7.0, 20.0, 26.0, 30.0, 58.0, 60.0, 121.0, 158.0, 262.0, 571.0, 1409.0, 3625.0, 12009.0, 56665.0, 554888.0, 3317659.0, 210244.0, 27012.0, 5878.0, 1930.0, 747.0, 399.0, 200.0, 110.0, 61.0, 34.0, 24.0, 23.0, 8.0, 6.0, 7.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-6.80078125, -6.632171630859375, -6.46356201171875, -6.294952392578125, -6.1263427734375, -5.957733154296875, -5.78912353515625, -5.620513916015625, -5.451904296875, -5.283294677734375, -5.11468505859375, -4.946075439453125, -4.7774658203125, -4.608856201171875, -4.44024658203125, -4.271636962890625, -4.10302734375, -3.934417724609375, -3.76580810546875, -3.597198486328125, -3.4285888671875, -3.259979248046875, -3.09136962890625, -2.922760009765625, -2.754150390625, -2.585540771484375, -2.41693115234375, -2.248321533203125, -2.0797119140625, -1.911102294921875, -1.74249267578125, -1.573883056640625, -1.4052734375, -1.236663818359375, -1.06805419921875, -0.899444580078125, -0.7308349609375, -0.562225341796875, -0.39361572265625, -0.225006103515625, -0.056396484375, 0.112213134765625, 0.28082275390625, 0.449432373046875, 0.6180419921875, 0.786651611328125, 0.95526123046875, 1.123870849609375, 1.29248046875, 1.461090087890625, 1.62969970703125, 1.798309326171875, 1.9669189453125, 2.135528564453125, 2.30413818359375, 2.472747802734375, 2.641357421875, 2.809967041015625, 2.97857666015625, 3.147186279296875, 3.3157958984375, 3.484405517578125, 3.65301513671875, 3.821624755859375, 3.990234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 9.0, 7.0, 15.0, 21.0, 27.0, 41.0, 69.0, 111.0, 166.0, 378.0, 821.0, 1126.0, 663.0, 272.0, 157.0, 70.0, 44.0, 25.0, 28.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.859375, -10.596435546875, -10.33349609375, -10.070556640625, -9.8076171875, -9.544677734375, -9.28173828125, -9.018798828125, -8.755859375, -8.492919921875, -8.22998046875, -7.967041015625, -7.7041015625, -7.441162109375, -7.17822265625, -6.915283203125, -6.65234375, -6.389404296875, -6.12646484375, -5.863525390625, -5.6005859375, -5.337646484375, -5.07470703125, -4.811767578125, -4.548828125, -4.285888671875, -4.02294921875, -3.760009765625, -3.4970703125, -3.234130859375, -2.97119140625, -2.708251953125, -2.4453125, -2.182373046875, -1.91943359375, -1.656494140625, -1.3935546875, -1.130615234375, -0.86767578125, -0.604736328125, -0.341796875, -0.078857421875, 0.18408203125, 0.447021484375, 0.7099609375, 0.972900390625, 1.23583984375, 1.498779296875, 1.76171875, 2.024658203125, 2.28759765625, 2.550537109375, 2.8134765625, 3.076416015625, 3.33935546875, 3.602294921875, 3.865234375, 4.128173828125, 4.39111328125, 4.654052734375, 4.9169921875, 5.179931640625, 5.44287109375, 5.705810546875, 5.96875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 13.0, 24.0, 93.0, 194.0, 312.0, 200.0, 96.0, 30.0, 15.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0848388671875, -62.64365768432617, -60.202476501464844, -57.76129913330078, -55.32011795043945, -52.878936767578125, -50.43775939941406, -47.996578216552734, -45.555397033691406, -43.11421585083008, -40.67303466796875, -38.23185729980469, -35.79067611694336, -33.34949493408203, -30.908315658569336, -28.46713638305664, -26.025955200195312, -23.584774017333984, -21.14359474182129, -18.702415466308594, -16.261234283447266, -13.820054054260254, -11.378873825073242, -8.937694549560547, -6.496513366699219, -4.055333137512207, -1.6141529083251953, 0.8270273208618164, 3.268207550048828, 5.70938777923584, 8.150568008422852, 10.591747283935547, 13.032928466796875, 15.474108695983887, 17.9152889251709, 20.356468200683594, 22.797649383544922, 25.23883056640625, 27.680009841918945, 30.12118911743164, 32.56237030029297, 35.0035514831543, 37.444732666015625, 39.88591003417969, 42.327091217041016, 44.768272399902344, 47.209449768066406, 49.650630950927734, 52.09181213378906, 54.53299331665039, 56.97417449951172, 59.41535186767578, 61.85653305053711, 64.29771423339844, 66.7388916015625, 69.18006896972656, 71.62125396728516, 74.06243133544922, 76.50361633300781, 78.94479370117188, 81.38597106933594, 83.82715606689453, 86.2683334350586, 88.70951843261719, 91.15069580078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 9.0, 9.0, 20.0, 19.0, 23.0, 18.0, 27.0, 28.0, 30.0, 28.0, 50.0, 43.0, 39.0, 44.0, 41.0, 41.0, 43.0, 44.0, 41.0, 31.0, 36.0, 35.0, 33.0, 29.0, 24.0, 29.0, 22.0, 25.0, 21.0, 18.0, 12.0, 13.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.15709686279297, -21.41603660583496, -20.674978256225586, -19.933917999267578, -19.192859649658203, -18.451799392700195, -17.710739135742188, -16.969680786132812, -16.228620529174805, -15.487561225891113, -14.746501922607422, -14.005441665649414, -13.264382362365723, -12.523323059082031, -11.782262802124023, -11.041203498840332, -10.30014419555664, -9.55908489227295, -8.818025588989258, -8.07696533203125, -7.335906028747559, -6.594846725463867, -5.853786945343018, -5.112727165222168, -4.371667861938477, -3.630608320236206, -2.8895487785339355, -2.148489236831665, -1.4074296951293945, -0.666370153427124, 0.07468938827514648, 0.8157491683959961, 1.5568084716796875, 2.297868013381958, 3.0389275550842285, 3.779987096786499, 4.5210466384887695, 5.262105941772461, 6.0031657218933105, 6.74422550201416, 7.485284805297852, 8.226344108581543, 8.967403411865234, 9.708463668823242, 10.449522972106934, 11.190582275390625, 11.931642532348633, 12.672701835632324, 13.413761138916016, 14.154820442199707, 14.895879745483398, 15.636940002441406, 16.37799835205078, 17.11905860900879, 17.860118865966797, 18.601177215576172, 19.34223747253418, 20.083297729492188, 20.824356079101562, 21.56541633605957, 22.306476593017578, 23.047534942626953, 23.78859519958496, 24.52965545654297, 25.270713806152344]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 11.0, 9.0, 29.0, 31.0, 53.0, 77.0, 104.0, 170.0, 249.0, 345.0, 526.0, 859.0, 1366.0, 2251.0, 3927.0, 6365.0, 11472.0, 21189.0, 40431.0, 75584.0, 144374.0, 238038.0, 224963.0, 129172.0, 67445.0, 35161.0, 19248.0, 10336.0, 5715.0, 3461.0, 1977.0, 1267.0, 782.0, 527.0, 358.0, 227.0, 164.0, 87.0, 64.0, 50.0, 33.0, 22.0, 13.0, 7.0, 8.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.52734375, -2.442840576171875, -2.35833740234375, -2.273834228515625, -2.1893310546875, -2.104827880859375, -2.02032470703125, -1.935821533203125, -1.851318359375, -1.766815185546875, -1.68231201171875, -1.597808837890625, -1.5133056640625, -1.428802490234375, -1.34429931640625, -1.259796142578125, -1.17529296875, -1.090789794921875, -1.00628662109375, -0.921783447265625, -0.8372802734375, -0.752777099609375, -0.66827392578125, -0.583770751953125, -0.499267578125, -0.414764404296875, -0.33026123046875, -0.245758056640625, -0.1612548828125, -0.076751708984375, 0.00775146484375, 0.092254638671875, 0.1767578125, 0.261260986328125, 0.34576416015625, 0.430267333984375, 0.5147705078125, 0.599273681640625, 0.68377685546875, 0.768280029296875, 0.852783203125, 0.937286376953125, 1.02178955078125, 1.106292724609375, 1.1907958984375, 1.275299072265625, 1.35980224609375, 1.444305419921875, 1.52880859375, 1.613311767578125, 1.69781494140625, 1.782318115234375, 1.8668212890625, 1.951324462890625, 2.03582763671875, 2.120330810546875, 2.204833984375, 2.289337158203125, 2.37384033203125, 2.458343505859375, 2.5428466796875, 2.627349853515625, 2.71185302734375, 2.796356201171875, 2.880859375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 7.0, 4.0, 1.0, 6.0, 7.0, 9.0, 18.0, 22.0, 24.0, 20.0, 22.0, 29.0, 30.0, 36.0, 37.0, 36.0, 43.0, 42.0, 40.0, 55.0, 46.0, 49.0, 57.0, 45.0, 27.0, 37.0, 35.0, 30.0, 25.0, 23.0, 36.0, 22.0, 18.0, 12.0, 15.0, 6.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0], "bins": [-2.63671875, -2.567718505859375, -2.49871826171875, -2.429718017578125, -2.3607177734375, -2.291717529296875, -2.22271728515625, -2.153717041015625, -2.084716796875, -2.015716552734375, -1.94671630859375, -1.877716064453125, -1.8087158203125, -1.739715576171875, -1.67071533203125, -1.601715087890625, -1.53271484375, -1.463714599609375, -1.39471435546875, -1.325714111328125, -1.2567138671875, -1.187713623046875, -1.11871337890625, -1.049713134765625, -0.980712890625, -0.911712646484375, -0.84271240234375, -0.773712158203125, -0.7047119140625, -0.635711669921875, -0.56671142578125, -0.497711181640625, -0.4287109375, -0.359710693359375, -0.29071044921875, -0.221710205078125, -0.1527099609375, -0.083709716796875, -0.01470947265625, 0.054290771484375, 0.123291015625, 0.192291259765625, 0.26129150390625, 0.330291748046875, 0.3992919921875, 0.468292236328125, 0.53729248046875, 0.606292724609375, 0.67529296875, 0.744293212890625, 0.81329345703125, 0.882293701171875, 0.9512939453125, 1.020294189453125, 1.08929443359375, 1.158294677734375, 1.227294921875, 1.296295166015625, 1.36529541015625, 1.434295654296875, 1.5032958984375, 1.572296142578125, 1.64129638671875, 1.710296630859375, 1.779296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 4.0, 19.0, 14.0, 27.0, 28.0, 26.0, 61.0, 100.0, 107.0, 176.0, 228.0, 381.0, 539.0, 929.0, 1710.0, 3896.0, 12626.0, 65361.0, 570371.0, 326689.0, 48043.0, 9738.0, 3385.0, 1501.0, 817.0, 557.0, 330.0, 238.0, 176.0, 115.0, 98.0, 67.0, 43.0, 32.0, 25.0, 20.0, 17.0, 15.0, 6.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.3828125, -7.15850830078125, -6.9342041015625, -6.70989990234375, -6.485595703125, -6.26129150390625, -6.0369873046875, -5.81268310546875, -5.58837890625, -5.36407470703125, -5.1397705078125, -4.91546630859375, -4.691162109375, -4.46685791015625, -4.2425537109375, -4.01824951171875, -3.7939453125, -3.56964111328125, -3.3453369140625, -3.12103271484375, -2.896728515625, -2.67242431640625, -2.4481201171875, -2.22381591796875, -1.99951171875, -1.77520751953125, -1.5509033203125, -1.32659912109375, -1.102294921875, -0.87799072265625, -0.6536865234375, -0.42938232421875, -0.205078125, 0.01922607421875, 0.2435302734375, 0.46783447265625, 0.692138671875, 0.91644287109375, 1.1407470703125, 1.36505126953125, 1.58935546875, 1.81365966796875, 2.0379638671875, 2.26226806640625, 2.486572265625, 2.71087646484375, 2.9351806640625, 3.15948486328125, 3.3837890625, 3.60809326171875, 3.8323974609375, 4.05670166015625, 4.281005859375, 4.50531005859375, 4.7296142578125, 4.95391845703125, 5.17822265625, 5.40252685546875, 5.6268310546875, 5.85113525390625, 6.075439453125, 6.29974365234375, 6.5240478515625, 6.74835205078125, 6.97265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 4.0, 5.0, 12.0, 9.0, 16.0, 21.0, 24.0, 35.0, 26.0, 38.0, 34.0, 61.0, 42.0, 42.0, 47.0, 57.0, 55.0, 55.0, 64.0, 64.0, 37.0, 39.0, 37.0, 16.0, 28.0, 26.0, 16.0, 24.0, 16.0, 11.0, 9.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.84820556640625, -6.5596923828125, -6.27117919921875, -5.982666015625, -5.69415283203125, -5.4056396484375, -5.11712646484375, -4.82861328125, -4.54010009765625, -4.2515869140625, -3.96307373046875, -3.674560546875, -3.38604736328125, -3.0975341796875, -2.80902099609375, -2.5205078125, -2.23199462890625, -1.9434814453125, -1.65496826171875, -1.366455078125, -1.07794189453125, -0.7894287109375, -0.50091552734375, -0.21240234375, 0.07611083984375, 0.3646240234375, 0.65313720703125, 0.941650390625, 1.23016357421875, 1.5186767578125, 1.80718994140625, 2.095703125, 2.38421630859375, 2.6727294921875, 2.96124267578125, 3.249755859375, 3.53826904296875, 3.8267822265625, 4.11529541015625, 4.40380859375, 4.69232177734375, 4.9808349609375, 5.26934814453125, 5.557861328125, 5.84637451171875, 6.1348876953125, 6.42340087890625, 6.7119140625, 7.00042724609375, 7.2889404296875, 7.57745361328125, 7.865966796875, 8.15447998046875, 8.4429931640625, 8.73150634765625, 9.02001953125, 9.30853271484375, 9.5970458984375, 9.88555908203125, 10.174072265625, 10.46258544921875, 10.7510986328125, 11.03961181640625, 11.328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 6.0, 7.0, 14.0, 35.0, 53.0, 101.0, 279.0, 881.0, 4456.0, 72147.0, 896729.0, 68151.0, 4359.0, 858.0, 240.0, 116.0, 51.0, 23.0, 20.0, 5.0, 3.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8203125, -2.6890869140625, -2.557861328125, -2.4266357421875, -2.29541015625, -2.1641845703125, -2.032958984375, -1.9017333984375, -1.7705078125, -1.6392822265625, -1.508056640625, -1.3768310546875, -1.24560546875, -1.1143798828125, -0.983154296875, -0.8519287109375, -0.720703125, -0.5894775390625, -0.458251953125, -0.3270263671875, -0.19580078125, -0.0645751953125, 0.066650390625, 0.1978759765625, 0.3291015625, 0.4603271484375, 0.591552734375, 0.7227783203125, 0.85400390625, 0.9852294921875, 1.116455078125, 1.2476806640625, 1.37890625, 1.5101318359375, 1.641357421875, 1.7725830078125, 1.90380859375, 2.0350341796875, 2.166259765625, 2.2974853515625, 2.4287109375, 2.5599365234375, 2.691162109375, 2.8223876953125, 2.95361328125, 3.0848388671875, 3.216064453125, 3.3472900390625, 3.478515625, 3.6097412109375, 3.740966796875, 3.8721923828125, 4.00341796875, 4.1346435546875, 4.265869140625, 4.3970947265625, 4.5283203125, 4.6595458984375, 4.790771484375, 4.9219970703125, 5.05322265625, 5.1844482421875, 5.315673828125, 5.4468994140625, 5.578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 7.0, 8.0, 13.0, 16.0, 13.0, 17.0, 21.0, 36.0, 36.0, 53.0, 51.0, 71.0, 74.0, 76.0, 62.0, 91.0, 65.0, 60.0, 43.0, 43.0, 30.0, 24.0, 10.0, 16.0, 14.0, 8.0, 5.0, 9.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0006165504455566406, -0.0005993470549583435, -0.0005821436643600464, -0.0005649402737617493, -0.0005477368831634521, -0.000530533492565155, -0.0005133301019668579, -0.0004961267113685608, -0.00047892332077026367, -0.00046171993017196655, -0.00044451653957366943, -0.0004273131489753723, -0.0004101097583770752, -0.0003929063677787781, -0.00037570297718048096, -0.00035849958658218384, -0.0003412961959838867, -0.0003240928053855896, -0.0003068894147872925, -0.00028968602418899536, -0.00027248263359069824, -0.0002552792429924011, -0.000238075852394104, -0.00022087246179580688, -0.00020366907119750977, -0.00018646568059921265, -0.00016926229000091553, -0.0001520588994026184, -0.0001348555088043213, -0.00011765211820602417, -0.00010044872760772705, -8.324533700942993e-05, -6.604194641113281e-05, -4.883855581283569e-05, -3.1635165214538574e-05, -1.4431774616241455e-05, 2.771615982055664e-06, 1.9975006580352783e-05, 3.71783971786499e-05, 5.438178777694702e-05, 7.158517837524414e-05, 8.878856897354126e-05, 0.00010599195957183838, 0.0001231953501701355, 0.00014039874076843262, 0.00015760213136672974, 0.00017480552196502686, 0.00019200891256332397, 0.0002092123031616211, 0.0002264156937599182, 0.00024361908435821533, 0.00026082247495651245, 0.00027802586555480957, 0.0002952292561531067, 0.0003124326467514038, 0.00032963603734970093, 0.00034683942794799805, 0.00036404281854629517, 0.0003812462091445923, 0.0003984495997428894, 0.0004156529903411865, 0.00043285638093948364, 0.00045005977153778076, 0.0004672631621360779, 0.000484466552734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 1.0, 8.0, 17.0, 11.0, 20.0, 33.0, 51.0, 94.0, 135.0, 241.0, 413.0, 788.0, 1548.0, 3780.0, 12479.0, 71792.0, 596433.0, 303248.0, 42882.0, 8724.0, 3041.0, 1268.0, 656.0, 345.0, 193.0, 127.0, 78.0, 53.0, 37.0, 24.0, 15.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.2856597900390625, -2.223663330078125, -2.1616668701171875, -2.09967041015625, -2.0376739501953125, -1.975677490234375, -1.9136810302734375, -1.8516845703125, -1.7896881103515625, -1.727691650390625, -1.6656951904296875, -1.60369873046875, -1.5417022705078125, -1.479705810546875, -1.4177093505859375, -1.355712890625, -1.2937164306640625, -1.231719970703125, -1.1697235107421875, -1.10772705078125, -1.0457305908203125, -0.983734130859375, -0.9217376708984375, -0.8597412109375, -0.7977447509765625, -0.735748291015625, -0.6737518310546875, -0.61175537109375, -0.5497589111328125, -0.487762451171875, -0.4257659912109375, -0.36376953125, -0.3017730712890625, -0.239776611328125, -0.1777801513671875, -0.11578369140625, -0.0537872314453125, 0.008209228515625, 0.0702056884765625, 0.1322021484375, 0.1941986083984375, 0.256195068359375, 0.3181915283203125, 0.38018798828125, 0.4421844482421875, 0.504180908203125, 0.5661773681640625, 0.628173828125, 0.6901702880859375, 0.752166748046875, 0.8141632080078125, 0.87615966796875, 0.9381561279296875, 1.000152587890625, 1.0621490478515625, 1.1241455078125, 1.1861419677734375, 1.248138427734375, 1.3101348876953125, 1.37213134765625, 1.4341278076171875, 1.496124267578125, 1.5581207275390625, 1.6201171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 5.0, 6.0, 5.0, 12.0, 5.0, 12.0, 18.0, 18.0, 8.0, 29.0, 25.0, 37.0, 35.0, 39.0, 38.0, 49.0, 57.0, 53.0, 49.0, 48.0, 46.0, 56.0, 54.0, 34.0, 37.0, 26.0, 37.0, 26.0, 30.0, 24.0, 14.0, 15.0, 7.0, 14.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3359375, -1.29400634765625, -1.2520751953125, -1.21014404296875, -1.168212890625, -1.12628173828125, -1.0843505859375, -1.04241943359375, -1.00048828125, -0.95855712890625, -0.9166259765625, -0.87469482421875, -0.832763671875, -0.79083251953125, -0.7489013671875, -0.70697021484375, -0.6650390625, -0.62310791015625, -0.5811767578125, -0.53924560546875, -0.497314453125, -0.45538330078125, -0.4134521484375, -0.37152099609375, -0.32958984375, -0.28765869140625, -0.2457275390625, -0.20379638671875, -0.161865234375, -0.11993408203125, -0.0780029296875, -0.03607177734375, 0.005859375, 0.04779052734375, 0.0897216796875, 0.13165283203125, 0.173583984375, 0.21551513671875, 0.2574462890625, 0.29937744140625, 0.34130859375, 0.38323974609375, 0.4251708984375, 0.46710205078125, 0.509033203125, 0.55096435546875, 0.5928955078125, 0.63482666015625, 0.6767578125, 0.71868896484375, 0.7606201171875, 0.80255126953125, 0.844482421875, 0.88641357421875, 0.9283447265625, 0.97027587890625, 1.01220703125, 1.05413818359375, 1.0960693359375, 1.13800048828125, 1.179931640625, 1.22186279296875, 1.2637939453125, 1.30572509765625, 1.34765625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 25.0, 77.0, 284.0, 402.0, 148.0, 33.0, 12.0, 9.0, 2.0, 0.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.11856842041016, -80.77030944824219, -77.42205047607422, -74.07379150390625, -70.72554016113281, -67.37728118896484, -64.02902221679688, -60.680763244628906, -57.3325080871582, -53.984249114990234, -50.63599395751953, -47.28773498535156, -43.939476013183594, -40.59122085571289, -37.24296188354492, -33.89470672607422, -30.54644775390625, -27.198190689086914, -23.849933624267578, -20.50167465209961, -17.153417587280273, -13.805160522460938, -10.456901550292969, -7.108644485473633, -3.760387420654297, -0.41212987899780273, 2.9361276626586914, 6.284385681152344, 9.63264274597168, 12.980899810791016, 16.329158782958984, 19.67741584777832, 23.025680541992188, 26.373937606811523, 29.72219467163086, 33.07045364379883, 36.41870880126953, 39.7669677734375, 43.11522674560547, 46.46348571777344, 49.81174087524414, 53.15999984741211, 56.50825500488281, 59.85651397705078, 63.20477294921875, 66.55302429199219, 69.90129089355469, 73.24954223632812, 76.5978012084961, 79.94606018066406, 83.29431915283203, 86.642578125, 89.99082946777344, 93.3390884399414, 96.68734741210938, 100.03560638427734, 103.38386535644531, 106.73212432861328, 110.08038330078125, 113.42863464355469, 116.77689361572266, 120.12515258789062, 123.4734115600586, 126.82167053222656, 130.169921875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 6.0, 11.0, 11.0, 13.0, 8.0, 24.0, 17.0, 21.0, 23.0, 21.0, 31.0, 26.0, 28.0, 49.0, 45.0, 63.0, 70.0, 74.0, 61.0, 57.0, 31.0, 27.0, 37.0, 33.0, 27.0, 30.0, 29.0, 20.0, 22.0, 13.0, 9.0, 12.0, 8.0, 8.0, 6.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.632476806640625, -29.653396606445312, -28.674314498901367, -27.695232391357422, -26.71615219116211, -25.737071990966797, -24.75798988342285, -23.778907775878906, -22.799827575683594, -21.82074737548828, -20.841665267944336, -19.86258316040039, -18.883502960205078, -17.904422760009766, -16.92534065246582, -15.946259498596191, -14.967178344726562, -13.988097190856934, -13.009016036987305, -12.029934883117676, -11.050853729248047, -10.071772575378418, -9.092691421508789, -8.11361026763916, -7.134529113769531, -6.155447959899902, -5.176366806030273, -4.1972856521606445, -3.2182044982910156, -2.2391233444213867, -1.2600421905517578, -0.2809610366821289, 0.6981201171875, 1.677201271057129, 2.656282424926758, 3.6353635787963867, 4.614444732666016, 5.5935258865356445, 6.572607040405273, 7.551688194274902, 8.530769348144531, 9.50985050201416, 10.488931655883789, 11.468012809753418, 12.447093963623047, 13.426175117492676, 14.405256271362305, 15.384337425231934, 16.363418579101562, 17.342498779296875, 18.32158088684082, 19.300662994384766, 20.279743194580078, 21.25882339477539, 22.237905502319336, 23.21698760986328, 24.196067810058594, 25.175148010253906, 26.15423011779785, 27.133312225341797, 28.11239242553711, 29.091472625732422, 30.070554733276367, 31.049636840820312, 32.028717041015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 14.0, 15.0, 24.0, 32.0, 53.0, 73.0, 153.0, 255.0, 447.0, 860.0, 1688.0, 3739.0, 9156.0, 27326.0, 112407.0, 593988.0, 2147590.0, 1041733.0, 189736.0, 41608.0, 13214.0, 5259.0, 2308.0, 1159.0, 579.0, 340.0, 184.0, 123.0, 69.0, 43.0, 24.0, 23.0, 10.0, 13.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.60784912109375, -1.5399169921875, -1.47198486328125, -1.404052734375, -1.33612060546875, -1.2681884765625, -1.20025634765625, -1.13232421875, -1.06439208984375, -0.9964599609375, -0.92852783203125, -0.860595703125, -0.79266357421875, -0.7247314453125, -0.65679931640625, -0.5888671875, -0.52093505859375, -0.4530029296875, -0.38507080078125, -0.317138671875, -0.24920654296875, -0.1812744140625, -0.11334228515625, -0.04541015625, 0.02252197265625, 0.0904541015625, 0.15838623046875, 0.226318359375, 0.29425048828125, 0.3621826171875, 0.43011474609375, 0.498046875, 0.56597900390625, 0.6339111328125, 0.70184326171875, 0.769775390625, 0.83770751953125, 0.9056396484375, 0.97357177734375, 1.04150390625, 1.10943603515625, 1.1773681640625, 1.24530029296875, 1.313232421875, 1.38116455078125, 1.4490966796875, 1.51702880859375, 1.5849609375, 1.65289306640625, 1.7208251953125, 1.78875732421875, 1.856689453125, 1.92462158203125, 1.9925537109375, 2.06048583984375, 2.12841796875, 2.19635009765625, 2.2642822265625, 2.33221435546875, 2.400146484375, 2.46807861328125, 2.5360107421875, 2.60394287109375, 2.671875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 27.0, 14.0, 25.0, 23.0, 34.0, 42.0, 43.0, 41.0, 45.0, 52.0, 49.0, 47.0, 57.0, 57.0, 45.0, 53.0, 45.0, 47.0, 36.0, 33.0, 34.0, 27.0, 20.0, 18.0, 12.0, 9.0, 5.0, 12.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.468963623046875, -2.39495849609375, -2.320953369140625, -2.2469482421875, -2.172943115234375, -2.09893798828125, -2.024932861328125, -1.950927734375, -1.876922607421875, -1.80291748046875, -1.728912353515625, -1.6549072265625, -1.580902099609375, -1.50689697265625, -1.432891845703125, -1.35888671875, -1.284881591796875, -1.21087646484375, -1.136871337890625, -1.0628662109375, -0.988861083984375, -0.91485595703125, -0.840850830078125, -0.766845703125, -0.692840576171875, -0.61883544921875, -0.544830322265625, -0.4708251953125, -0.396820068359375, -0.32281494140625, -0.248809814453125, -0.1748046875, -0.100799560546875, -0.02679443359375, 0.047210693359375, 0.1212158203125, 0.195220947265625, 0.26922607421875, 0.343231201171875, 0.417236328125, 0.491241455078125, 0.56524658203125, 0.639251708984375, 0.7132568359375, 0.787261962890625, 0.86126708984375, 0.935272216796875, 1.00927734375, 1.083282470703125, 1.15728759765625, 1.231292724609375, 1.3052978515625, 1.379302978515625, 1.45330810546875, 1.527313232421875, 1.601318359375, 1.675323486328125, 1.74932861328125, 1.823333740234375, 1.8973388671875, 1.971343994140625, 2.04534912109375, 2.119354248046875, 2.193359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 3.0, 8.0, 12.0, 11.0, 23.0, 52.0, 103.0, 239.0, 515.0, 1623.0, 9362.0, 245970.0, 3877120.0, 52687.0, 4470.0, 1154.0, 468.0, 216.0, 113.0, 51.0, 35.0, 17.0, 13.0, 11.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.953125, -9.6712646484375, -9.389404296875, -9.1075439453125, -8.82568359375, -8.5438232421875, -8.261962890625, -7.9801025390625, -7.6982421875, -7.4163818359375, -7.134521484375, -6.8526611328125, -6.57080078125, -6.2889404296875, -6.007080078125, -5.7252197265625, -5.443359375, -5.1614990234375, -4.879638671875, -4.5977783203125, -4.31591796875, -4.0340576171875, -3.752197265625, -3.4703369140625, -3.1884765625, -2.9066162109375, -2.624755859375, -2.3428955078125, -2.06103515625, -1.7791748046875, -1.497314453125, -1.2154541015625, -0.93359375, -0.6517333984375, -0.369873046875, -0.0880126953125, 0.19384765625, 0.4757080078125, 0.757568359375, 1.0394287109375, 1.3212890625, 1.6031494140625, 1.885009765625, 2.1668701171875, 2.44873046875, 2.7305908203125, 3.012451171875, 3.2943115234375, 3.576171875, 3.8580322265625, 4.139892578125, 4.4217529296875, 4.70361328125, 4.9854736328125, 5.267333984375, 5.5491943359375, 5.8310546875, 6.1129150390625, 6.394775390625, 6.6766357421875, 6.95849609375, 7.2403564453125, 7.522216796875, 7.8040771484375, 8.0859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 14.0, 18.0, 35.0, 57.0, 118.0, 270.0, 766.0, 1331.0, 840.0, 336.0, 120.0, 58.0, 38.0, 25.0, 11.0, 9.0, 10.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.38671875, -7.12823486328125, -6.8697509765625, -6.61126708984375, -6.352783203125, -6.09429931640625, -5.8358154296875, -5.57733154296875, -5.31884765625, -5.06036376953125, -4.8018798828125, -4.54339599609375, -4.284912109375, -4.02642822265625, -3.7679443359375, -3.50946044921875, -3.2509765625, -2.99249267578125, -2.7340087890625, -2.47552490234375, -2.217041015625, -1.95855712890625, -1.7000732421875, -1.44158935546875, -1.18310546875, -0.92462158203125, -0.6661376953125, -0.40765380859375, -0.149169921875, 0.10931396484375, 0.3677978515625, 0.62628173828125, 0.884765625, 1.14324951171875, 1.4017333984375, 1.66021728515625, 1.918701171875, 2.17718505859375, 2.4356689453125, 2.69415283203125, 2.95263671875, 3.21112060546875, 3.4696044921875, 3.72808837890625, 3.986572265625, 4.24505615234375, 4.5035400390625, 4.76202392578125, 5.0205078125, 5.27899169921875, 5.5374755859375, 5.79595947265625, 6.054443359375, 6.31292724609375, 6.5714111328125, 6.82989501953125, 7.08837890625, 7.34686279296875, 7.6053466796875, 7.86383056640625, 8.122314453125, 8.38079833984375, 8.6392822265625, 8.89776611328125, 9.15625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 22.0, 383.0, 507.0, 58.0, 17.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.98286437988281, -87.84374237060547, -82.70462036132812, -77.56549835205078, -72.42637634277344, -67.2872543334961, -62.14813232421875, -57.009010314941406, -51.86988830566406, -46.73076629638672, -41.591644287109375, -36.45252227783203, -31.313400268554688, -26.174278259277344, -21.03515625, -15.896034240722656, -10.756912231445312, -5.617790222167969, -0.478668212890625, 4.660453796386719, 9.799575805664062, 14.938697814941406, 20.07781982421875, 25.216941833496094, 30.356063842773438, 35.49518585205078, 40.634307861328125, 45.77342987060547, 50.91255187988281, 56.051673889160156, 61.1907958984375, 66.32991790771484, 71.46902465820312, 76.60814666748047, 81.74726867675781, 86.88639068603516, 92.0255126953125, 97.16463470458984, 102.30375671386719, 107.44287872314453, 112.58200073242188, 117.72112274169922, 122.86024475097656, 127.9993667602539, 133.13848876953125, 138.27761840820312, 143.41673278808594, 148.55584716796875, 153.69497680664062, 158.8341064453125, 163.9732208251953, 169.11233520507812, 174.25146484375, 179.39059448242188, 184.5297088623047, 189.6688232421875, 194.80795288085938, 199.94708251953125, 205.08619689941406, 210.22531127929688, 215.36444091796875, 220.50357055664062, 225.64268493652344, 230.78179931640625, 235.92092895507812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 6.0, 21.0, 18.0, 9.0, 17.0, 29.0, 34.0, 55.0, 58.0, 75.0, 73.0, 92.0, 75.0, 91.0, 80.0, 53.0, 60.0, 46.0, 33.0, 22.0, 16.0, 15.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.274860382080078, -28.04176139831543, -26.80866241455078, -25.575563430786133, -24.342464447021484, -23.10936737060547, -21.87626838684082, -20.643169403076172, -19.410070419311523, -18.176971435546875, -16.943872451782227, -15.710774421691895, -14.477675437927246, -13.244576454162598, -12.011478424072266, -10.778379440307617, -9.545280456542969, -8.31218147277832, -7.07908296585083, -5.84598445892334, -4.612885475158691, -3.379786491394043, -2.1466879844665527, -0.9135894775390625, 0.31950950622558594, 1.5526082515716553, 2.7857069969177246, 4.018805503845215, 5.251904487609863, 6.485003471374512, 7.718101978302002, 8.951200485229492, 10.18429946899414, 11.417398452758789, 12.650497436523438, 13.88359546661377, 15.116694450378418, 16.34979248046875, 17.5828914642334, 18.815990447998047, 20.049089431762695, 21.282188415527344, 22.515287399291992, 23.74838638305664, 24.981483459472656, 26.214584350585938, 27.447681427001953, 28.6807804107666, 29.91387939453125, 31.1469783782959, 32.38007736206055, 33.61317443847656, 34.846275329589844, 36.07937240600586, 37.31247329711914, 38.545570373535156, 39.77867126464844, 41.01176834106445, 42.244869232177734, 43.47796630859375, 44.71106719970703, 45.94416427612305, 47.17726516723633, 48.410362243652344, 49.64345932006836]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 4.0, 10.0, 4.0, 20.0, 22.0, 24.0, 57.0, 119.0, 149.0, 251.0, 401.0, 664.0, 1136.0, 2138.0, 3986.0, 8149.0, 16581.0, 35494.0, 78201.0, 163021.0, 260150.0, 234040.0, 130073.0, 59929.0, 27156.0, 13034.0, 6394.0, 3260.0, 1655.0, 1011.0, 549.0, 339.0, 201.0, 120.0, 71.0, 55.0, 36.0, 18.0, 14.0, 15.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -1.9927978515625, -1.905517578125, -1.8182373046875, -1.73095703125, -1.6436767578125, -1.556396484375, -1.4691162109375, -1.3818359375, -1.2945556640625, -1.207275390625, -1.1199951171875, -1.03271484375, -0.9454345703125, -0.858154296875, -0.7708740234375, -0.68359375, -0.5963134765625, -0.509033203125, -0.4217529296875, -0.33447265625, -0.2471923828125, -0.159912109375, -0.0726318359375, 0.0146484375, 0.1019287109375, 0.189208984375, 0.2764892578125, 0.36376953125, 0.4510498046875, 0.538330078125, 0.6256103515625, 0.712890625, 0.8001708984375, 0.887451171875, 0.9747314453125, 1.06201171875, 1.1492919921875, 1.236572265625, 1.3238525390625, 1.4111328125, 1.4984130859375, 1.585693359375, 1.6729736328125, 1.76025390625, 1.8475341796875, 1.934814453125, 2.0220947265625, 2.109375, 2.1966552734375, 2.283935546875, 2.3712158203125, 2.45849609375, 2.5457763671875, 2.633056640625, 2.7203369140625, 2.8076171875, 2.8948974609375, 2.982177734375, 3.0694580078125, 3.15673828125, 3.2440185546875, 3.331298828125, 3.4185791015625, 3.505859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 6.0, 12.0, 7.0, 14.0, 18.0, 11.0, 16.0, 26.0, 23.0, 37.0, 37.0, 43.0, 39.0, 48.0, 52.0, 47.0, 43.0, 39.0, 48.0, 52.0, 32.0, 43.0, 39.0, 36.0, 38.0, 27.0, 22.0, 28.0, 17.0, 18.0, 15.0, 15.0, 7.0, 14.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.517578125, -2.448455810546875, -2.37933349609375, -2.310211181640625, -2.2410888671875, -2.171966552734375, -2.10284423828125, -2.033721923828125, -1.964599609375, -1.895477294921875, -1.82635498046875, -1.757232666015625, -1.6881103515625, -1.618988037109375, -1.54986572265625, -1.480743408203125, -1.41162109375, -1.342498779296875, -1.27337646484375, -1.204254150390625, -1.1351318359375, -1.066009521484375, -0.99688720703125, -0.927764892578125, -0.858642578125, -0.789520263671875, -0.72039794921875, -0.651275634765625, -0.5821533203125, -0.513031005859375, -0.44390869140625, -0.374786376953125, -0.3056640625, -0.236541748046875, -0.16741943359375, -0.098297119140625, -0.0291748046875, 0.039947509765625, 0.10906982421875, 0.178192138671875, 0.247314453125, 0.316436767578125, 0.38555908203125, 0.454681396484375, 0.5238037109375, 0.592926025390625, 0.66204833984375, 0.731170654296875, 0.80029296875, 0.869415283203125, 0.93853759765625, 1.007659912109375, 1.0767822265625, 1.145904541015625, 1.21502685546875, 1.284149169921875, 1.353271484375, 1.422393798828125, 1.49151611328125, 1.560638427734375, 1.6297607421875, 1.698883056640625, 1.76800537109375, 1.837127685546875, 1.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 6.0, 6.0, 7.0, 18.0, 22.0, 29.0, 27.0, 38.0, 46.0, 61.0, 105.0, 200.0, 312.0, 673.0, 1589.0, 4740.0, 18763.0, 105875.0, 634696.0, 230904.0, 37720.0, 8288.0, 2395.0, 889.0, 437.0, 228.0, 140.0, 88.0, 63.0, 43.0, 36.0, 27.0, 14.0, 13.0, 13.0, 7.0, 9.0, 3.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.26953125, -6.077880859375, -5.88623046875, -5.694580078125, -5.5029296875, -5.311279296875, -5.11962890625, -4.927978515625, -4.736328125, -4.544677734375, -4.35302734375, -4.161376953125, -3.9697265625, -3.778076171875, -3.58642578125, -3.394775390625, -3.203125, -3.011474609375, -2.81982421875, -2.628173828125, -2.4365234375, -2.244873046875, -2.05322265625, -1.861572265625, -1.669921875, -1.478271484375, -1.28662109375, -1.094970703125, -0.9033203125, -0.711669921875, -0.52001953125, -0.328369140625, -0.13671875, 0.054931640625, 0.24658203125, 0.438232421875, 0.6298828125, 0.821533203125, 1.01318359375, 1.204833984375, 1.396484375, 1.588134765625, 1.77978515625, 1.971435546875, 2.1630859375, 2.354736328125, 2.54638671875, 2.738037109375, 2.9296875, 3.121337890625, 3.31298828125, 3.504638671875, 3.6962890625, 3.887939453125, 4.07958984375, 4.271240234375, 4.462890625, 4.654541015625, 4.84619140625, 5.037841796875, 5.2294921875, 5.421142578125, 5.61279296875, 5.804443359375, 5.99609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 9.0, 16.0, 17.0, 17.0, 28.0, 48.0, 50.0, 42.0, 51.0, 68.0, 60.0, 74.0, 67.0, 64.0, 72.0, 45.0, 67.0, 35.0, 29.0, 31.0, 26.0, 22.0, 10.0, 14.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.690185546875, -10.35693359375, -10.023681640625, -9.6904296875, -9.357177734375, -9.02392578125, -8.690673828125, -8.357421875, -8.024169921875, -7.69091796875, -7.357666015625, -7.0244140625, -6.691162109375, -6.35791015625, -6.024658203125, -5.69140625, -5.358154296875, -5.02490234375, -4.691650390625, -4.3583984375, -4.025146484375, -3.69189453125, -3.358642578125, -3.025390625, -2.692138671875, -2.35888671875, -2.025634765625, -1.6923828125, -1.359130859375, -1.02587890625, -0.692626953125, -0.359375, -0.026123046875, 0.30712890625, 0.640380859375, 0.9736328125, 1.306884765625, 1.64013671875, 1.973388671875, 2.306640625, 2.639892578125, 2.97314453125, 3.306396484375, 3.6396484375, 3.972900390625, 4.30615234375, 4.639404296875, 4.97265625, 5.305908203125, 5.63916015625, 5.972412109375, 6.3056640625, 6.638916015625, 6.97216796875, 7.305419921875, 7.638671875, 7.971923828125, 8.30517578125, 8.638427734375, 8.9716796875, 9.304931640625, 9.63818359375, 9.971435546875, 10.3046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 7.0, 20.0, 44.0, 61.0, 75.0, 144.0, 264.0, 534.0, 1058.0, 2441.0, 6505.0, 19642.0, 72991.0, 304922.0, 515451.0, 88860.0, 22906.0, 7337.0, 2775.0, 1261.0, 594.0, 257.0, 164.0, 74.0, 49.0, 36.0, 23.0, 19.0, 10.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.704315185546875, -1.65277099609375, -1.601226806640625, -1.5496826171875, -1.498138427734375, -1.44659423828125, -1.395050048828125, -1.343505859375, -1.291961669921875, -1.24041748046875, -1.188873291015625, -1.1373291015625, -1.085784912109375, -1.03424072265625, -0.982696533203125, -0.93115234375, -0.879608154296875, -0.82806396484375, -0.776519775390625, -0.7249755859375, -0.673431396484375, -0.62188720703125, -0.570343017578125, -0.518798828125, -0.467254638671875, -0.41571044921875, -0.364166259765625, -0.3126220703125, -0.261077880859375, -0.20953369140625, -0.157989501953125, -0.1064453125, -0.054901123046875, -0.00335693359375, 0.048187255859375, 0.0997314453125, 0.151275634765625, 0.20281982421875, 0.254364013671875, 0.305908203125, 0.357452392578125, 0.40899658203125, 0.460540771484375, 0.5120849609375, 0.563629150390625, 0.61517333984375, 0.666717529296875, 0.71826171875, 0.769805908203125, 0.82135009765625, 0.872894287109375, 0.9244384765625, 0.975982666015625, 1.02752685546875, 1.079071044921875, 1.130615234375, 1.182159423828125, 1.23370361328125, 1.285247802734375, 1.3367919921875, 1.388336181640625, 1.43988037109375, 1.491424560546875, 1.54296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 12.0, 9.0, 19.0, 22.0, 45.0, 73.0, 103.0, 156.0, 151.0, 124.0, 103.0, 59.0, 43.0, 21.0, 20.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00115966796875, -0.0011286139488220215, -0.001097559928894043, -0.0010665059089660645, -0.001035451889038086, -0.0010043978691101074, -0.0009733438491821289, -0.0009422898292541504, -0.0009112358093261719, -0.0008801817893981934, -0.0008491277694702148, -0.0008180737495422363, -0.0007870197296142578, -0.0007559657096862793, -0.0007249116897583008, -0.0006938576698303223, -0.0006628036499023438, -0.0006317496299743652, -0.0006006956100463867, -0.0005696415901184082, -0.0005385875701904297, -0.0005075335502624512, -0.00047647953033447266, -0.00044542551040649414, -0.0004143714904785156, -0.0003833174705505371, -0.0003522634506225586, -0.0003212094306945801, -0.00029015541076660156, -0.00025910139083862305, -0.00022804737091064453, -0.00019699335098266602, -0.0001659393310546875, -0.00013488531112670898, -0.00010383129119873047, -7.277727127075195e-05, -4.172325134277344e-05, -1.0669231414794922e-05, 2.0384788513183594e-05, 5.143880844116211e-05, 8.249282836914062e-05, 0.00011354684829711914, 0.00014460086822509766, 0.00017565488815307617, 0.0002067089080810547, 0.0002377629280090332, 0.0002688169479370117, 0.00029987096786499023, 0.00033092498779296875, 0.00036197900772094727, 0.0003930330276489258, 0.0004240870475769043, 0.0004551410675048828, 0.00048619508743286133, 0.0005172491073608398, 0.0005483031272888184, 0.0005793571472167969, 0.0006104111671447754, 0.0006414651870727539, 0.0006725192070007324, 0.0007035732269287109, 0.0007346272468566895, 0.000765681266784668, 0.0007967352867126465, 0.000827789306640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 5.0, 7.0, 14.0, 18.0, 28.0, 53.0, 102.0, 145.0, 234.0, 475.0, 983.0, 2501.0, 7950.0, 30130.0, 144794.0, 614840.0, 191737.0, 39347.0, 9770.0, 3138.0, 1108.0, 524.0, 257.0, 146.0, 74.0, 43.0, 33.0, 34.0, 11.0, 9.0, 11.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.119140625, -2.0642242431640625, -2.009307861328125, -1.9543914794921875, -1.89947509765625, -1.8445587158203125, -1.789642333984375, -1.7347259521484375, -1.6798095703125, -1.6248931884765625, -1.569976806640625, -1.5150604248046875, -1.46014404296875, -1.4052276611328125, -1.350311279296875, -1.2953948974609375, -1.240478515625, -1.1855621337890625, -1.130645751953125, -1.0757293701171875, -1.02081298828125, -0.9658966064453125, -0.910980224609375, -0.8560638427734375, -0.8011474609375, -0.7462310791015625, -0.691314697265625, -0.6363983154296875, -0.58148193359375, -0.5265655517578125, -0.471649169921875, -0.4167327880859375, -0.36181640625, -0.3069000244140625, -0.251983642578125, -0.1970672607421875, -0.14215087890625, -0.0872344970703125, -0.032318115234375, 0.0225982666015625, 0.0775146484375, 0.1324310302734375, 0.187347412109375, 0.2422637939453125, 0.29718017578125, 0.3520965576171875, 0.407012939453125, 0.4619293212890625, 0.516845703125, 0.5717620849609375, 0.626678466796875, 0.6815948486328125, 0.73651123046875, 0.7914276123046875, 0.846343994140625, 0.9012603759765625, 0.9561767578125, 1.0110931396484375, 1.066009521484375, 1.1209259033203125, 1.17584228515625, 1.2307586669921875, 1.285675048828125, 1.3405914306640625, 1.3955078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 17.0, 13.0, 14.0, 24.0, 31.0, 43.0, 51.0, 52.0, 56.0, 80.0, 74.0, 82.0, 87.0, 66.0, 64.0, 44.0, 45.0, 29.0, 26.0, 28.0, 19.0, 16.0, 12.0, 6.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.498046875, -2.43719482421875, -2.3763427734375, -2.31549072265625, -2.254638671875, -2.19378662109375, -2.1329345703125, -2.07208251953125, -2.01123046875, -1.95037841796875, -1.8895263671875, -1.82867431640625, -1.767822265625, -1.70697021484375, -1.6461181640625, -1.58526611328125, -1.5244140625, -1.46356201171875, -1.4027099609375, -1.34185791015625, -1.281005859375, -1.22015380859375, -1.1593017578125, -1.09844970703125, -1.03759765625, -0.97674560546875, -0.9158935546875, -0.85504150390625, -0.794189453125, -0.73333740234375, -0.6724853515625, -0.61163330078125, -0.55078125, -0.48992919921875, -0.4290771484375, -0.36822509765625, -0.307373046875, -0.24652099609375, -0.1856689453125, -0.12481689453125, -0.06396484375, -0.00311279296875, 0.0577392578125, 0.11859130859375, 0.179443359375, 0.24029541015625, 0.3011474609375, 0.36199951171875, 0.4228515625, 0.48370361328125, 0.5445556640625, 0.60540771484375, 0.666259765625, 0.72711181640625, 0.7879638671875, 0.84881591796875, 0.90966796875, 0.97052001953125, 1.0313720703125, 1.09222412109375, 1.153076171875, 1.21392822265625, 1.2747802734375, 1.33563232421875, 1.396484375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 12.0, 17.0, 35.0, 57.0, 123.0, 248.0, 264.0, 105.0, 70.0, 32.0, 20.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.70728302001953, -72.79360961914062, -70.87992858886719, -68.96625518798828, -67.05257415771484, -65.13890075683594, -63.225223541259766, -61.311546325683594, -59.39786911010742, -57.48419189453125, -55.57051467895508, -53.656837463378906, -51.7431640625, -49.82948303222656, -47.915809631347656, -46.002132415771484, -44.08845520019531, -42.17477798461914, -40.26110076904297, -38.3474235534668, -36.433746337890625, -34.52007293701172, -32.60639572143555, -30.692718505859375, -28.779041290283203, -26.86536407470703, -24.95168685913086, -23.03801155090332, -21.12433433532715, -19.210657119750977, -17.296981811523438, -15.383304595947266, -13.469627380371094, -11.555950164794922, -9.642273902893066, -7.728597164154053, -5.814920425415039, -3.901243209838867, -1.9875669479370117, -0.07389068603515625, 1.8397865295410156, 3.7534632682800293, 5.667140007019043, 7.580816745758057, 9.49449348449707, 11.408170700073242, 13.321846961975098, 15.235523223876953, 17.149200439453125, 19.062877655029297, 20.97655487060547, 22.890230178833008, 24.80390739440918, 26.71758460998535, 28.63125991821289, 30.544937133789062, 32.458614349365234, 34.372291564941406, 36.28596878051758, 38.19964599609375, 40.113319396972656, 42.027000427246094, 43.940673828125, 45.85435104370117, 47.768028259277344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 3.0, 7.0, 10.0, 17.0, 16.0, 19.0, 18.0, 19.0, 23.0, 23.0, 41.0, 37.0, 41.0, 26.0, 53.0, 87.0, 96.0, 68.0, 63.0, 42.0, 38.0, 34.0, 31.0, 31.0, 24.0, 24.0, 10.0, 21.0, 15.0, 5.0, 8.0, 11.0, 8.0, 2.0, 8.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.77023696899414, -32.593143463134766, -31.416048049926758, -30.23895263671875, -29.061859130859375, -27.884763717651367, -26.70766830444336, -25.530574798583984, -24.353479385375977, -23.17638397216797, -21.999290466308594, -20.822195053100586, -19.645099639892578, -18.468006134033203, -17.290910720825195, -16.113815307617188, -14.936721801757812, -13.759627342224121, -12.58253288269043, -11.405437469482422, -10.22834300994873, -9.051248550415039, -7.8741536140441895, -6.69705867767334, -5.519964218139648, -4.342869758605957, -3.1657748222351074, -1.988680124282837, -0.8115854263305664, 0.365509033203125, 1.5426039695739746, 2.719698905944824, 3.89678955078125, 5.073884010314941, 6.250978946685791, 7.428073883056641, 8.605168342590332, 9.782262802124023, 10.959358215332031, 12.136452674865723, 13.313547134399414, 14.490641593933105, 15.667736053466797, 16.844831466674805, 18.021926879882812, 19.199020385742188, 20.376115798950195, 21.553211212158203, 22.730304718017578, 23.907400131225586, 25.08449363708496, 26.26158905029297, 27.438682556152344, 28.61577796936035, 29.79287338256836, 30.969966888427734, 32.147064208984375, 33.32415771484375, 34.50125503540039, 35.678348541259766, 36.85544204711914, 38.03253936767578, 39.209632873535156, 40.38672637939453, 41.563819885253906]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 3.0, 15.0, 18.0, 25.0, 34.0, 27.0, 44.0, 90.0, 107.0, 164.0, 358.0, 687.0, 1568.0, 4333.0, 13252.0, 53521.0, 274154.0, 1391495.0, 1891861.0, 446760.0, 85252.0, 20256.0, 6007.0, 2278.0, 904.0, 425.0, 228.0, 110.0, 75.0, 52.0, 41.0, 33.0, 23.0, 14.0, 9.0, 9.0, 6.0, 6.0, 5.0, 6.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40234375, -2.327606201171875, -2.25286865234375, -2.178131103515625, -2.1033935546875, -2.028656005859375, -1.95391845703125, -1.879180908203125, -1.804443359375, -1.729705810546875, -1.65496826171875, -1.580230712890625, -1.5054931640625, -1.430755615234375, -1.35601806640625, -1.281280517578125, -1.20654296875, -1.131805419921875, -1.05706787109375, -0.982330322265625, -0.9075927734375, -0.832855224609375, -0.75811767578125, -0.683380126953125, -0.608642578125, -0.533905029296875, -0.45916748046875, -0.384429931640625, -0.3096923828125, -0.234954833984375, -0.16021728515625, -0.085479736328125, -0.0107421875, 0.063995361328125, 0.13873291015625, 0.213470458984375, 0.2882080078125, 0.362945556640625, 0.43768310546875, 0.512420654296875, 0.587158203125, 0.661895751953125, 0.73663330078125, 0.811370849609375, 0.8861083984375, 0.960845947265625, 1.03558349609375, 1.110321044921875, 1.18505859375, 1.259796142578125, 1.33453369140625, 1.409271240234375, 1.4840087890625, 1.558746337890625, 1.63348388671875, 1.708221435546875, 1.782958984375, 1.857696533203125, 1.93243408203125, 2.007171630859375, 2.0819091796875, 2.156646728515625, 2.23138427734375, 2.306121826171875, 2.380859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 7.0, 13.0, 8.0, 21.0, 25.0, 19.0, 30.0, 39.0, 37.0, 41.0, 48.0, 38.0, 57.0, 66.0, 56.0, 50.0, 61.0, 46.0, 40.0, 54.0, 38.0, 40.0, 30.0, 21.0, 24.0, 18.0, 15.0, 11.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.637176513671875, -2.55364990234375, -2.470123291015625, -2.3865966796875, -2.303070068359375, -2.21954345703125, -2.136016845703125, -2.052490234375, -1.968963623046875, -1.88543701171875, -1.801910400390625, -1.7183837890625, -1.634857177734375, -1.55133056640625, -1.467803955078125, -1.38427734375, -1.300750732421875, -1.21722412109375, -1.133697509765625, -1.0501708984375, -0.966644287109375, -0.88311767578125, -0.799591064453125, -0.716064453125, -0.632537841796875, -0.54901123046875, -0.465484619140625, -0.3819580078125, -0.298431396484375, -0.21490478515625, -0.131378173828125, -0.0478515625, 0.035675048828125, 0.11920166015625, 0.202728271484375, 0.2862548828125, 0.369781494140625, 0.45330810546875, 0.536834716796875, 0.620361328125, 0.703887939453125, 0.78741455078125, 0.870941162109375, 0.9544677734375, 1.037994384765625, 1.12152099609375, 1.205047607421875, 1.28857421875, 1.372100830078125, 1.45562744140625, 1.539154052734375, 1.6226806640625, 1.706207275390625, 1.78973388671875, 1.873260498046875, 1.956787109375, 2.040313720703125, 2.12384033203125, 2.207366943359375, 2.2908935546875, 2.374420166015625, 2.45794677734375, 2.541473388671875, 2.625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 23.0, 26.0, 50.0, 93.0, 154.0, 276.0, 618.0, 2039.0, 11298.0, 173000.0, 3722859.0, 265012.0, 14837.0, 2505.0, 758.0, 313.0, 150.0, 104.0, 48.0, 34.0, 19.0, 9.0, 9.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.703125, -6.5091552734375, -6.315185546875, -6.1212158203125, -5.92724609375, -5.7332763671875, -5.539306640625, -5.3453369140625, -5.1513671875, -4.9573974609375, -4.763427734375, -4.5694580078125, -4.37548828125, -4.1815185546875, -3.987548828125, -3.7935791015625, -3.599609375, -3.4056396484375, -3.211669921875, -3.0177001953125, -2.82373046875, -2.6297607421875, -2.435791015625, -2.2418212890625, -2.0478515625, -1.8538818359375, -1.659912109375, -1.4659423828125, -1.27197265625, -1.0780029296875, -0.884033203125, -0.6900634765625, -0.49609375, -0.3021240234375, -0.108154296875, 0.0858154296875, 0.27978515625, 0.4737548828125, 0.667724609375, 0.8616943359375, 1.0556640625, 1.2496337890625, 1.443603515625, 1.6375732421875, 1.83154296875, 2.0255126953125, 2.219482421875, 2.4134521484375, 2.607421875, 2.8013916015625, 2.995361328125, 3.1893310546875, 3.38330078125, 3.5772705078125, 3.771240234375, 3.9652099609375, 4.1591796875, 4.3531494140625, 4.547119140625, 4.7410888671875, 4.93505859375, 5.1290283203125, 5.322998046875, 5.5169677734375, 5.7109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 10.0, 29.0, 36.0, 51.0, 70.0, 100.0, 221.0, 360.0, 611.0, 780.0, 679.0, 433.0, 270.0, 162.0, 93.0, 53.0, 40.0, 18.0, 9.0, 11.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.1796875, -6.0162353515625, -5.852783203125, -5.6893310546875, -5.52587890625, -5.3624267578125, -5.198974609375, -5.0355224609375, -4.8720703125, -4.7086181640625, -4.545166015625, -4.3817138671875, -4.21826171875, -4.0548095703125, -3.891357421875, -3.7279052734375, -3.564453125, -3.4010009765625, -3.237548828125, -3.0740966796875, -2.91064453125, -2.7471923828125, -2.583740234375, -2.4202880859375, -2.2568359375, -2.0933837890625, -1.929931640625, -1.7664794921875, -1.60302734375, -1.4395751953125, -1.276123046875, -1.1126708984375, -0.94921875, -0.7857666015625, -0.622314453125, -0.4588623046875, -0.29541015625, -0.1319580078125, 0.031494140625, 0.1949462890625, 0.3583984375, 0.5218505859375, 0.685302734375, 0.8487548828125, 1.01220703125, 1.1756591796875, 1.339111328125, 1.5025634765625, 1.666015625, 1.8294677734375, 1.992919921875, 2.1563720703125, 2.31982421875, 2.4832763671875, 2.646728515625, 2.8101806640625, 2.9736328125, 3.1370849609375, 3.300537109375, 3.4639892578125, 3.62744140625, 3.7908935546875, 3.954345703125, 4.1177978515625, 4.28125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 25.0, 102.0, 347.0, 367.0, 108.0, 34.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-141.87994384765625, -139.25193786621094, -136.62393188476562, -133.9959259033203, -131.36793518066406, -128.73992919921875, -126.11192321777344, -123.48391723632812, -120.85591125488281, -118.2279052734375, -115.59990692138672, -112.9719009399414, -110.3438949584961, -107.71589660644531, -105.087890625, -102.45988464355469, -99.8318862915039, -97.2038803100586, -94.57588195800781, -91.9478759765625, -89.31986999511719, -86.69186401367188, -84.0638656616211, -81.43585968017578, -78.807861328125, -76.17985534667969, -73.5518569946289, -70.9238510131836, -68.29584503173828, -65.6678466796875, -63.03984069824219, -60.411834716796875, -57.78383255004883, -55.15583038330078, -52.52782440185547, -49.89982223510742, -47.271820068359375, -44.64381408691406, -42.015811920166016, -39.38780975341797, -36.759803771972656, -34.13180160522461, -31.503795623779297, -28.87579345703125, -26.24778938293457, -23.61978530883789, -20.991783142089844, -18.363779067993164, -15.735774993896484, -13.107770919799805, -10.479767799377441, -7.85176420211792, -5.223760604858398, -2.5957565307617188, 0.03224658966064453, 2.660249710083008, 5.2882537841796875, 7.916257381439209, 10.54426097869873, 13.172264099121094, 15.800268173217773, 18.428272247314453, 21.0562744140625, 23.68427848815918, 26.31228256225586]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 4.0, 10.0, 7.0, 8.0, 8.0, 9.0, 13.0, 16.0, 20.0, 26.0, 39.0, 27.0, 25.0, 38.0, 31.0, 41.0, 36.0, 31.0, 39.0, 37.0, 32.0, 40.0, 38.0, 42.0, 47.0, 30.0, 43.0, 36.0, 22.0, 33.0, 21.0, 21.0, 17.0, 17.0, 17.0, 12.0, 16.0, 7.0, 8.0, 9.0, 5.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.322376251220703, -16.767051696777344, -16.211727142333984, -15.656401634216309, -15.101076126098633, -14.545751571655273, -13.990427017211914, -13.435101509094238, -12.879776000976562, -12.324451446533203, -11.769125938415527, -11.213801383972168, -10.658475875854492, -10.103151321411133, -9.547826766967773, -8.992501258850098, -8.437176704406738, -7.881851673126221, -7.326526641845703, -6.771202087402344, -6.215876579284668, -5.660552024841309, -5.105226993560791, -4.549901962280273, -3.994576930999756, -3.4392518997192383, -2.8839268684387207, -2.3286020755767822, -1.7732770442962646, -1.217952013015747, -0.6626272201538086, -0.10730218887329102, 0.44802284240722656, 1.0033478736877441, 1.5586727857589722, 2.1139976978302, 2.6693227291107178, 3.2246477603912354, 3.779972553253174, 4.335297584533691, 4.890622615814209, 5.445947647094727, 6.001272678375244, 6.556597709655762, 7.111922264099121, 7.667247772216797, 8.222572326660156, 8.777896881103516, 9.333222389221191, 9.88854694366455, 10.443872451782227, 10.999197006225586, 11.554522514343262, 12.109847068786621, 12.665172576904297, 13.220497131347656, 13.775821685791016, 14.331146240234375, 14.88647174835205, 15.44179630279541, 15.997121810913086, 16.552446365356445, 17.107770919799805, 17.663097381591797, 18.218421936035156]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 11.0, 11.0, 25.0, 24.0, 39.0, 62.0, 88.0, 129.0, 163.0, 252.0, 417.0, 591.0, 923.0, 1544.0, 2569.0, 4518.0, 7621.0, 13656.0, 24427.0, 44357.0, 78863.0, 140192.0, 210912.0, 206588.0, 136566.0, 76868.0, 42226.0, 23543.0, 13028.0, 7308.0, 4306.0, 2609.0, 1446.0, 913.0, 570.0, 378.0, 234.0, 179.0, 121.0, 79.0, 67.0, 44.0, 39.0, 13.0, 11.0, 8.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.763671875, -1.702789306640625, -1.64190673828125, -1.581024169921875, -1.5201416015625, -1.459259033203125, -1.39837646484375, -1.337493896484375, -1.276611328125, -1.215728759765625, -1.15484619140625, -1.093963623046875, -1.0330810546875, -0.972198486328125, -0.91131591796875, -0.850433349609375, -0.78955078125, -0.728668212890625, -0.66778564453125, -0.606903076171875, -0.5460205078125, -0.485137939453125, -0.42425537109375, -0.363372802734375, -0.302490234375, -0.241607666015625, -0.18072509765625, -0.119842529296875, -0.0589599609375, 0.001922607421875, 0.06280517578125, 0.123687744140625, 0.1845703125, 0.245452880859375, 0.30633544921875, 0.367218017578125, 0.4281005859375, 0.488983154296875, 0.54986572265625, 0.610748291015625, 0.671630859375, 0.732513427734375, 0.79339599609375, 0.854278564453125, 0.9151611328125, 0.976043701171875, 1.03692626953125, 1.097808837890625, 1.15869140625, 1.219573974609375, 1.28045654296875, 1.341339111328125, 1.4022216796875, 1.463104248046875, 1.52398681640625, 1.584869384765625, 1.645751953125, 1.706634521484375, 1.76751708984375, 1.828399658203125, 1.8892822265625, 1.950164794921875, 2.01104736328125, 2.071929931640625, 2.1328125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 8.0, 5.0, 16.0, 13.0, 16.0, 12.0, 28.0, 33.0, 39.0, 43.0, 44.0, 40.0, 50.0, 36.0, 42.0, 48.0, 54.0, 54.0, 56.0, 55.0, 38.0, 41.0, 55.0, 40.0, 22.0, 25.0, 14.0, 10.0, 8.0, 5.0, 15.0, 9.0, 6.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.75, -2.6708984375, -2.591796875, -2.5126953125, -2.43359375, -2.3544921875, -2.275390625, -2.1962890625, -2.1171875, -2.0380859375, -1.958984375, -1.8798828125, -1.80078125, -1.7216796875, -1.642578125, -1.5634765625, -1.484375, -1.4052734375, -1.326171875, -1.2470703125, -1.16796875, -1.0888671875, -1.009765625, -0.9306640625, -0.8515625, -0.7724609375, -0.693359375, -0.6142578125, -0.53515625, -0.4560546875, -0.376953125, -0.2978515625, -0.21875, -0.1396484375, -0.060546875, 0.0185546875, 0.09765625, 0.1767578125, 0.255859375, 0.3349609375, 0.4140625, 0.4931640625, 0.572265625, 0.6513671875, 0.73046875, 0.8095703125, 0.888671875, 0.9677734375, 1.046875, 1.1259765625, 1.205078125, 1.2841796875, 1.36328125, 1.4423828125, 1.521484375, 1.6005859375, 1.6796875, 1.7587890625, 1.837890625, 1.9169921875, 1.99609375, 2.0751953125, 2.154296875, 2.2333984375, 2.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 9.0, 14.0, 17.0, 20.0, 35.0, 56.0, 74.0, 134.0, 221.0, 310.0, 526.0, 996.0, 2454.0, 9323.0, 57389.0, 644622.0, 286915.0, 34908.0, 6432.0, 1925.0, 830.0, 477.0, 292.0, 185.0, 125.0, 71.0, 43.0, 43.0, 28.0, 17.0, 12.0, 13.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0], "bins": [-8.328125, -8.1243896484375, -7.920654296875, -7.7169189453125, -7.51318359375, -7.3094482421875, -7.105712890625, -6.9019775390625, -6.6982421875, -6.4945068359375, -6.290771484375, -6.0870361328125, -5.88330078125, -5.6795654296875, -5.475830078125, -5.2720947265625, -5.068359375, -4.8646240234375, -4.660888671875, -4.4571533203125, -4.25341796875, -4.0496826171875, -3.845947265625, -3.6422119140625, -3.4384765625, -3.2347412109375, -3.031005859375, -2.8272705078125, -2.62353515625, -2.4197998046875, -2.216064453125, -2.0123291015625, -1.80859375, -1.6048583984375, -1.401123046875, -1.1973876953125, -0.99365234375, -0.7899169921875, -0.586181640625, -0.3824462890625, -0.1787109375, 0.0250244140625, 0.228759765625, 0.4324951171875, 0.63623046875, 0.8399658203125, 1.043701171875, 1.2474365234375, 1.451171875, 1.6549072265625, 1.858642578125, 2.0623779296875, 2.26611328125, 2.4698486328125, 2.673583984375, 2.8773193359375, 3.0810546875, 3.2847900390625, 3.488525390625, 3.6922607421875, 3.89599609375, 4.0997314453125, 4.303466796875, 4.5072021484375, 4.7109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 10.0, 18.0, 18.0, 26.0, 24.0, 36.0, 30.0, 31.0, 43.0, 67.0, 76.0, 65.0, 77.0, 68.0, 49.0, 69.0, 53.0, 35.0, 35.0, 30.0, 23.0, 24.0, 18.0, 19.0, 12.0, 7.0, 8.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.41552734375, -10.0966796875, -9.77783203125, -9.458984375, -9.14013671875, -8.8212890625, -8.50244140625, -8.18359375, -7.86474609375, -7.5458984375, -7.22705078125, -6.908203125, -6.58935546875, -6.2705078125, -5.95166015625, -5.6328125, -5.31396484375, -4.9951171875, -4.67626953125, -4.357421875, -4.03857421875, -3.7197265625, -3.40087890625, -3.08203125, -2.76318359375, -2.4443359375, -2.12548828125, -1.806640625, -1.48779296875, -1.1689453125, -0.85009765625, -0.53125, -0.21240234375, 0.1064453125, 0.42529296875, 0.744140625, 1.06298828125, 1.3818359375, 1.70068359375, 2.01953125, 2.33837890625, 2.6572265625, 2.97607421875, 3.294921875, 3.61376953125, 3.9326171875, 4.25146484375, 4.5703125, 4.88916015625, 5.2080078125, 5.52685546875, 5.845703125, 6.16455078125, 6.4833984375, 6.80224609375, 7.12109375, 7.43994140625, 7.7587890625, 8.07763671875, 8.396484375, 8.71533203125, 9.0341796875, 9.35302734375, 9.671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 8.0, 8.0, 13.0, 13.0, 28.0, 33.0, 50.0, 67.0, 88.0, 112.0, 183.0, 299.0, 537.0, 907.0, 1783.0, 3736.0, 8627.0, 22687.0, 66053.0, 229698.0, 555027.0, 102880.0, 32852.0, 12311.0, 5155.0, 2372.0, 1168.0, 693.0, 430.0, 208.0, 139.0, 105.0, 72.0, 46.0, 48.0, 26.0, 25.0, 13.0, 13.0, 10.0, 3.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0869140625, -1.05206298828125, -1.0172119140625, -0.98236083984375, -0.947509765625, -0.91265869140625, -0.8778076171875, -0.84295654296875, -0.80810546875, -0.77325439453125, -0.7384033203125, -0.70355224609375, -0.668701171875, -0.63385009765625, -0.5989990234375, -0.56414794921875, -0.529296875, -0.49444580078125, -0.4595947265625, -0.42474365234375, -0.389892578125, -0.35504150390625, -0.3201904296875, -0.28533935546875, -0.25048828125, -0.21563720703125, -0.1807861328125, -0.14593505859375, -0.111083984375, -0.07623291015625, -0.0413818359375, -0.00653076171875, 0.0283203125, 0.06317138671875, 0.0980224609375, 0.13287353515625, 0.167724609375, 0.20257568359375, 0.2374267578125, 0.27227783203125, 0.30712890625, 0.34197998046875, 0.3768310546875, 0.41168212890625, 0.446533203125, 0.48138427734375, 0.5162353515625, 0.55108642578125, 0.5859375, 0.62078857421875, 0.6556396484375, 0.69049072265625, 0.725341796875, 0.76019287109375, 0.7950439453125, 0.82989501953125, 0.86474609375, 0.89959716796875, 0.9344482421875, 0.96929931640625, 1.004150390625, 1.03900146484375, 1.0738525390625, 1.10870361328125, 1.1435546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 18.0, 30.0, 17.0, 49.0, 48.0, 78.0, 92.0, 99.0, 98.0, 83.0, 70.0, 57.0, 45.0, 38.0, 28.0, 16.0, 15.0, 16.0, 9.0, 9.0, 2.0, 7.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005331039428710938, -0.000517476350069046, -0.0005018487572669983, -0.00048622116446495056, -0.00047059357166290283, -0.0004549659788608551, -0.0004393383860588074, -0.00042371079325675964, -0.0004080832004547119, -0.0003924556076526642, -0.00037682801485061646, -0.0003612004220485687, -0.000345572829246521, -0.00032994523644447327, -0.00031431764364242554, -0.0002986900508403778, -0.0002830624580383301, -0.00026743486523628235, -0.0002518072724342346, -0.0002361796796321869, -0.00022055208683013916, -0.00020492449402809143, -0.0001892969012260437, -0.00017366930842399597, -0.00015804171562194824, -0.0001424141228199005, -0.00012678653001785278, -0.00011115893721580505, -9.553134441375732e-05, -7.99037516117096e-05, -6.427615880966187e-05, -4.8648566007614136e-05, -3.3020973205566406e-05, -1.7393380403518677e-05, -1.7657876014709473e-06, 1.3861805200576782e-05, 2.9489398002624512e-05, 4.511699080467224e-05, 6.074458360671997e-05, 7.63721764087677e-05, 9.199976921081543e-05, 0.00010762736201286316, 0.0001232549548149109, 0.00013888254761695862, 0.00015451014041900635, 0.00017013773322105408, 0.0001857653260231018, 0.00020139291882514954, 0.00021702051162719727, 0.000232648104429245, 0.0002482756972312927, 0.00026390329003334045, 0.0002795308828353882, 0.0002951584756374359, 0.00031078606843948364, 0.00032641366124153137, 0.0003420412540435791, 0.00035766884684562683, 0.00037329643964767456, 0.0003889240324497223, 0.00040455162525177, 0.00042017921805381775, 0.0004358068108558655, 0.0004514344036579132, 0.00046706199645996094]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 11.0, 15.0, 18.0, 15.0, 48.0, 56.0, 75.0, 118.0, 164.0, 260.0, 505.0, 980.0, 1986.0, 4697.0, 13034.0, 40416.0, 148313.0, 611522.0, 160091.0, 43048.0, 13650.0, 5046.0, 2086.0, 1040.0, 501.0, 287.0, 210.0, 122.0, 77.0, 38.0, 36.0, 26.0, 11.0, 12.0, 10.0, 13.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9552536010742188, -0.9178314208984375, -0.8804092407226562, -0.842987060546875, -0.8055648803710938, -0.7681427001953125, -0.7307205200195312, -0.69329833984375, -0.6558761596679688, -0.6184539794921875, -0.5810317993164062, -0.543609619140625, -0.5061874389648438, -0.4687652587890625, -0.43134307861328125, -0.3939208984375, -0.35649871826171875, -0.3190765380859375, -0.28165435791015625, -0.244232177734375, -0.20680999755859375, -0.1693878173828125, -0.13196563720703125, -0.09454345703125, -0.05712127685546875, -0.0196990966796875, 0.01772308349609375, 0.055145263671875, 0.09256744384765625, 0.1299896240234375, 0.16741180419921875, 0.204833984375, 0.24225616455078125, 0.2796783447265625, 0.31710052490234375, 0.354522705078125, 0.39194488525390625, 0.4293670654296875, 0.46678924560546875, 0.50421142578125, 0.5416336059570312, 0.5790557861328125, 0.6164779663085938, 0.653900146484375, 0.6913223266601562, 0.7287445068359375, 0.7661666870117188, 0.8035888671875, 0.8410110473632812, 0.8784332275390625, 0.9158554077148438, 0.953277587890625, 0.9906997680664062, 1.0281219482421875, 1.0655441284179688, 1.10296630859375, 1.1403884887695312, 1.1778106689453125, 1.2152328491210938, 1.252655029296875, 1.2900772094726562, 1.3274993896484375, 1.3649215698242188, 1.40234375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 11.0, 15.0, 21.0, 23.0, 36.0, 38.0, 59.0, 61.0, 73.0, 77.0, 81.0, 73.0, 72.0, 54.0, 61.0, 41.0, 38.0, 40.0, 24.0, 16.0, 20.0, 10.0, 7.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.87890625, -1.832489013671875, -1.78607177734375, -1.739654541015625, -1.6932373046875, -1.646820068359375, -1.60040283203125, -1.553985595703125, -1.507568359375, -1.461151123046875, -1.41473388671875, -1.368316650390625, -1.3218994140625, -1.275482177734375, -1.22906494140625, -1.182647705078125, -1.13623046875, -1.089813232421875, -1.04339599609375, -0.996978759765625, -0.9505615234375, -0.904144287109375, -0.85772705078125, -0.811309814453125, -0.764892578125, -0.718475341796875, -0.67205810546875, -0.625640869140625, -0.5792236328125, -0.532806396484375, -0.48638916015625, -0.439971923828125, -0.3935546875, -0.347137451171875, -0.30072021484375, -0.254302978515625, -0.2078857421875, -0.161468505859375, -0.11505126953125, -0.068634033203125, -0.022216796875, 0.024200439453125, 0.07061767578125, 0.117034912109375, 0.1634521484375, 0.209869384765625, 0.25628662109375, 0.302703857421875, 0.34912109375, 0.395538330078125, 0.44195556640625, 0.488372802734375, 0.5347900390625, 0.581207275390625, 0.62762451171875, 0.674041748046875, 0.720458984375, 0.766876220703125, 0.81329345703125, 0.859710693359375, 0.9061279296875, 0.952545166015625, 0.99896240234375, 1.045379638671875, 1.091796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 19.0, 35.0, 93.0, 191.0, 361.0, 157.0, 77.0, 36.0, 21.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-65.68341064453125, -63.874114990234375, -62.0648193359375, -60.255523681640625, -58.44622802734375, -56.636932373046875, -54.82763671875, -53.018341064453125, -51.20904541015625, -49.399749755859375, -47.5904541015625, -45.781158447265625, -43.97186279296875, -42.162567138671875, -40.353271484375, -38.543975830078125, -36.734676361083984, -34.92538070678711, -33.116085052490234, -31.30678939819336, -29.497493743896484, -27.68819808959961, -25.8789005279541, -24.069604873657227, -22.26030921936035, -20.451013565063477, -18.6417179107666, -16.832420349121094, -15.023125648498535, -13.21382999420166, -11.404533386230469, -9.595237731933594, -7.785942077636719, -5.976646423339844, -4.1673502922058105, -2.3580541610717773, -0.5487585067749023, 1.2605371475219727, 3.069833755493164, 4.879129409790039, 6.688425064086914, 8.497720718383789, 10.307016372680664, 12.116312980651855, 13.92560863494873, 15.734904289245605, 17.544200897216797, 19.353496551513672, 21.162792205810547, 22.972087860107422, 24.781383514404297, 26.590679168701172, 28.399974822998047, 30.209270477294922, 32.01856994628906, 33.82786560058594, 35.63716125488281, 37.44645690917969, 39.25575256347656, 41.06504821777344, 42.87434387207031, 44.68363952636719, 46.49293518066406, 48.30223083496094, 50.11152648925781]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 6.0, 13.0, 8.0, 9.0, 17.0, 15.0, 21.0, 22.0, 28.0, 22.0, 26.0, 29.0, 33.0, 42.0, 54.0, 104.0, 121.0, 66.0, 55.0, 32.0, 39.0, 33.0, 30.0, 22.0, 23.0, 22.0, 10.0, 18.0, 12.0, 12.0, 15.0, 6.0, 11.0, 2.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.92973327636719, -32.90850830078125, -31.887279510498047, -30.866052627563477, -29.844825744628906, -28.823598861694336, -27.802371978759766, -26.781147003173828, -25.759918212890625, -24.738691329956055, -23.717464447021484, -22.696237564086914, -21.675010681152344, -20.653783798217773, -19.632556915283203, -18.611331939697266, -17.590105056762695, -16.568878173828125, -15.547651290893555, -14.526424407958984, -13.505197525024414, -12.483970642089844, -11.46274471282959, -10.44151782989502, -9.42029094696045, -8.399064064025879, -7.377837181091309, -6.3566107749938965, -5.335383892059326, -4.314157009124756, -3.2929306030273438, -2.2717037200927734, -1.2504749298095703, -0.22924816608428955, 0.7919785976409912, 1.8132052421569824, 2.8344321250915527, 3.855659008026123, 4.876885414123535, 5.8981122970581055, 6.919339179992676, 7.940566062927246, 8.961792945861816, 9.98301887512207, 11.00424575805664, 12.025472640991211, 13.046699523925781, 14.067926406860352, 15.089153289794922, 16.110380172729492, 17.131607055664062, 18.152833938598633, 19.174060821533203, 20.195287704467773, 21.216514587402344, 22.23773956298828, 23.258968353271484, 24.280195236206055, 25.301422119140625, 26.322649002075195, 27.343875885009766, 28.365102767944336, 29.386329650878906, 30.407554626464844, 31.428781509399414]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 9.0, 11.0, 11.0, 25.0, 24.0, 39.0, 43.0, 76.0, 128.0, 203.0, 462.0, 977.0, 2488.0, 6905.0, 23785.0, 118012.0, 708735.0, 2169764.0, 942975.0, 171949.0, 33236.0, 8912.0, 3075.0, 1184.0, 559.0, 277.0, 143.0, 75.0, 53.0, 37.0, 25.0, 14.0, 15.0, 17.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.76953125, -2.69384765625, -2.6181640625, -2.54248046875, -2.466796875, -2.39111328125, -2.3154296875, -2.23974609375, -2.1640625, -2.08837890625, -2.0126953125, -1.93701171875, -1.861328125, -1.78564453125, -1.7099609375, -1.63427734375, -1.55859375, -1.48291015625, -1.4072265625, -1.33154296875, -1.255859375, -1.18017578125, -1.1044921875, -1.02880859375, -0.953125, -0.87744140625, -0.8017578125, -0.72607421875, -0.650390625, -0.57470703125, -0.4990234375, -0.42333984375, -0.34765625, -0.27197265625, -0.1962890625, -0.12060546875, -0.044921875, 0.03076171875, 0.1064453125, 0.18212890625, 0.2578125, 0.33349609375, 0.4091796875, 0.48486328125, 0.560546875, 0.63623046875, 0.7119140625, 0.78759765625, 0.86328125, 0.93896484375, 1.0146484375, 1.09033203125, 1.166015625, 1.24169921875, 1.3173828125, 1.39306640625, 1.46875, 1.54443359375, 1.6201171875, 1.69580078125, 1.771484375, 1.84716796875, 1.9228515625, 1.99853515625, 2.07421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 7.0, 6.0, 6.0, 9.0, 14.0, 19.0, 31.0, 32.0, 38.0, 36.0, 55.0, 47.0, 50.0, 49.0, 59.0, 66.0, 66.0, 71.0, 68.0, 52.0, 48.0, 37.0, 36.0, 27.0, 22.0, 13.0, 8.0, 10.0, 13.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.9312744140625, -2.843017578125, -2.7547607421875, -2.66650390625, -2.5782470703125, -2.489990234375, -2.4017333984375, -2.3134765625, -2.2252197265625, -2.136962890625, -2.0487060546875, -1.96044921875, -1.8721923828125, -1.783935546875, -1.6956787109375, -1.607421875, -1.5191650390625, -1.430908203125, -1.3426513671875, -1.25439453125, -1.1661376953125, -1.077880859375, -0.9896240234375, -0.9013671875, -0.8131103515625, -0.724853515625, -0.6365966796875, -0.54833984375, -0.4600830078125, -0.371826171875, -0.2835693359375, -0.1953125, -0.1070556640625, -0.018798828125, 0.0694580078125, 0.15771484375, 0.2459716796875, 0.334228515625, 0.4224853515625, 0.5107421875, 0.5989990234375, 0.687255859375, 0.7755126953125, 0.86376953125, 0.9520263671875, 1.040283203125, 1.1285400390625, 1.216796875, 1.3050537109375, 1.393310546875, 1.4815673828125, 1.56982421875, 1.6580810546875, 1.746337890625, 1.8345947265625, 1.9228515625, 2.0111083984375, 2.099365234375, 2.1876220703125, 2.27587890625, 2.3641357421875, 2.452392578125, 2.5406494140625, 2.62890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 10.0, 4.0, 12.0, 20.0, 28.0, 44.0, 47.0, 97.0, 162.0, 243.0, 485.0, 1168.0, 3630.0, 24422.0, 656107.0, 3401470.0, 94073.0, 8493.0, 1974.0, 792.0, 406.0, 210.0, 125.0, 82.0, 57.0, 32.0, 27.0, 19.0, 7.0, 9.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.32421875, -5.14215087890625, -4.9600830078125, -4.77801513671875, -4.595947265625, -4.41387939453125, -4.2318115234375, -4.04974365234375, -3.86767578125, -3.68560791015625, -3.5035400390625, -3.32147216796875, -3.139404296875, -2.95733642578125, -2.7752685546875, -2.59320068359375, -2.4111328125, -2.22906494140625, -2.0469970703125, -1.86492919921875, -1.682861328125, -1.50079345703125, -1.3187255859375, -1.13665771484375, -0.95458984375, -0.77252197265625, -0.5904541015625, -0.40838623046875, -0.226318359375, -0.04425048828125, 0.1378173828125, 0.31988525390625, 0.501953125, 0.68402099609375, 0.8660888671875, 1.04815673828125, 1.230224609375, 1.41229248046875, 1.5943603515625, 1.77642822265625, 1.95849609375, 2.14056396484375, 2.3226318359375, 2.50469970703125, 2.686767578125, 2.86883544921875, 3.0509033203125, 3.23297119140625, 3.4150390625, 3.59710693359375, 3.7791748046875, 3.96124267578125, 4.143310546875, 4.32537841796875, 4.5074462890625, 4.68951416015625, 4.87158203125, 5.05364990234375, 5.2357177734375, 5.41778564453125, 5.599853515625, 5.78192138671875, 5.9639892578125, 6.14605712890625, 6.328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 7.0, 11.0, 15.0, 26.0, 53.0, 88.0, 170.0, 342.0, 575.0, 861.0, 778.0, 511.0, 247.0, 154.0, 104.0, 51.0, 33.0, 17.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.728515625, -3.530853271484375, -3.33319091796875, -3.135528564453125, -2.9378662109375, -2.740203857421875, -2.54254150390625, -2.344879150390625, -2.147216796875, -1.949554443359375, -1.75189208984375, -1.554229736328125, -1.3565673828125, -1.158905029296875, -0.96124267578125, -0.763580322265625, -0.56591796875, -0.368255615234375, -0.17059326171875, 0.027069091796875, 0.2247314453125, 0.422393798828125, 0.62005615234375, 0.817718505859375, 1.015380859375, 1.213043212890625, 1.41070556640625, 1.608367919921875, 1.8060302734375, 2.003692626953125, 2.20135498046875, 2.399017333984375, 2.5966796875, 2.794342041015625, 2.99200439453125, 3.189666748046875, 3.3873291015625, 3.584991455078125, 3.78265380859375, 3.980316162109375, 4.177978515625, 4.375640869140625, 4.57330322265625, 4.770965576171875, 4.9686279296875, 5.166290283203125, 5.36395263671875, 5.561614990234375, 5.75927734375, 5.956939697265625, 6.15460205078125, 6.352264404296875, 6.5499267578125, 6.747589111328125, 6.94525146484375, 7.142913818359375, 7.340576171875, 7.538238525390625, 7.73590087890625, 7.933563232421875, 8.1312255859375, 8.328887939453125, 8.52655029296875, 8.724212646484375, 8.921875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 11.0, 9.0, 23.0, 75.0, 153.0, 253.0, 237.0, 119.0, 62.0, 28.0, 12.0, 4.0, 5.0, 3.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.820858001708984, -45.06989288330078, -43.318931579589844, -41.56796646118164, -39.8170051574707, -38.0660400390625, -36.31507873535156, -34.56411361694336, -32.813148498535156, -31.062185287475586, -29.311222076416016, -27.560256958007812, -25.809295654296875, -24.058330535888672, -22.3073673248291, -20.55640411376953, -18.805442810058594, -17.054479598999023, -15.303516387939453, -13.552552223205566, -11.801589012145996, -10.050625801086426, -8.299661636352539, -6.548698425292969, -4.797735214233398, -3.046771764755249, -1.2958083152770996, 0.4551553726196289, 2.206118583679199, 3.9570817947387695, 5.708045959472656, 7.459009170532227, 9.209968566894531, 10.960931777954102, 12.711894989013672, 14.462859153747559, 16.213821411132812, 17.964786529541016, 19.715749740600586, 21.466712951660156, 23.217676162719727, 24.968639373779297, 26.719602584838867, 28.470565795898438, 30.22153091430664, 31.972492218017578, 33.72345733642578, 35.47441864013672, 37.22538375854492, 38.976348876953125, 40.72731018066406, 42.478275299072266, 44.2292366027832, 45.980201721191406, 47.731163024902344, 49.48212814331055, 51.23309326171875, 52.98405838012695, 54.73501968383789, 56.485984802246094, 58.23694610595703, 59.987911224365234, 61.73887634277344, 63.489837646484375, 65.24079895019531]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 9.0, 7.0, 12.0, 8.0, 22.0, 15.0, 39.0, 32.0, 35.0, 46.0, 47.0, 52.0, 56.0, 46.0, 50.0, 50.0, 56.0, 46.0, 61.0, 40.0, 43.0, 40.0, 38.0, 24.0, 28.0, 17.0, 17.0, 12.0, 10.0, 11.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0], "bins": [-32.34654235839844, -31.590980529785156, -30.835418701171875, -30.079858779907227, -29.324296951293945, -28.568735122680664, -27.813173294067383, -27.057613372802734, -26.302051544189453, -25.546489715576172, -24.79092788696289, -24.035367965698242, -23.27980613708496, -22.52424430847168, -21.7686824798584, -21.01312255859375, -20.25756072998047, -19.501998901367188, -18.746437072753906, -17.990877151489258, -17.235315322875977, -16.479753494262695, -15.724191665649414, -14.96863079071045, -14.213068008422852, -13.45750617980957, -12.701945304870605, -11.946383476257324, -11.19082260131836, -10.435260772705078, -9.679698944091797, -8.924138069152832, -8.168577194213867, -7.413015842437744, -6.657454490661621, -5.90189266204834, -5.146331787109375, -4.390769958496094, -3.6352086067199707, -2.8796472549438477, -2.1240859031677246, -1.3685245513916016, -0.612963080406189, 0.14259839057922363, 0.8981597423553467, 1.6537210941314697, 2.409282684326172, 3.164844036102295, 3.920405387878418, 4.675966739654541, 5.431528091430664, 6.187089920043945, 6.94265079498291, 7.698212623596191, 8.453773498535156, 9.209335327148438, 9.964897155761719, 10.720458984375, 11.476019859313965, 12.231581687927246, 12.987142562866211, 13.742704391479492, 14.498266220092773, 15.253827095031738, 16.009387969970703]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 10.0, 12.0, 12.0, 19.0, 29.0, 50.0, 50.0, 112.0, 193.0, 262.0, 465.0, 859.0, 1387.0, 2696.0, 5062.0, 9946.0, 20972.0, 45735.0, 109176.0, 252419.0, 315840.0, 159730.0, 66093.0, 28963.0, 13559.0, 6961.0, 3536.0, 1876.0, 1002.0, 596.0, 345.0, 210.0, 125.0, 93.0, 59.0, 33.0, 22.0, 12.0, 13.0, 6.0, 9.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.8585205078125, -2.763916015625, -2.6693115234375, -2.57470703125, -2.4801025390625, -2.385498046875, -2.2908935546875, -2.1962890625, -2.1016845703125, -2.007080078125, -1.9124755859375, -1.81787109375, -1.7232666015625, -1.628662109375, -1.5340576171875, -1.439453125, -1.3448486328125, -1.250244140625, -1.1556396484375, -1.06103515625, -0.9664306640625, -0.871826171875, -0.7772216796875, -0.6826171875, -0.5880126953125, -0.493408203125, -0.3988037109375, -0.30419921875, -0.2095947265625, -0.114990234375, -0.0203857421875, 0.07421875, 0.1688232421875, 0.263427734375, 0.3580322265625, 0.45263671875, 0.5472412109375, 0.641845703125, 0.7364501953125, 0.8310546875, 0.9256591796875, 1.020263671875, 1.1148681640625, 1.20947265625, 1.3040771484375, 1.398681640625, 1.4932861328125, 1.587890625, 1.6824951171875, 1.777099609375, 1.8717041015625, 1.96630859375, 2.0609130859375, 2.155517578125, 2.2501220703125, 2.3447265625, 2.4393310546875, 2.533935546875, 2.6285400390625, 2.72314453125, 2.8177490234375, 2.912353515625, 3.0069580078125, 3.1015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 5.0, 8.0, 7.0, 15.0, 20.0, 17.0, 21.0, 29.0, 41.0, 47.0, 48.0, 49.0, 57.0, 63.0, 64.0, 56.0, 66.0, 71.0, 42.0, 58.0, 43.0, 41.0, 24.0, 27.0, 19.0, 25.0, 13.0, 4.0, 12.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.917144775390625, -2.82843017578125, -2.739715576171875, -2.6510009765625, -2.562286376953125, -2.47357177734375, -2.384857177734375, -2.296142578125, -2.207427978515625, -2.11871337890625, -2.029998779296875, -1.9412841796875, -1.852569580078125, -1.76385498046875, -1.675140380859375, -1.58642578125, -1.497711181640625, -1.40899658203125, -1.320281982421875, -1.2315673828125, -1.142852783203125, -1.05413818359375, -0.965423583984375, -0.876708984375, -0.787994384765625, -0.69927978515625, -0.610565185546875, -0.5218505859375, -0.433135986328125, -0.34442138671875, -0.255706787109375, -0.1669921875, -0.078277587890625, 0.01043701171875, 0.099151611328125, 0.1878662109375, 0.276580810546875, 0.36529541015625, 0.454010009765625, 0.542724609375, 0.631439208984375, 0.72015380859375, 0.808868408203125, 0.8975830078125, 0.986297607421875, 1.07501220703125, 1.163726806640625, 1.25244140625, 1.341156005859375, 1.42987060546875, 1.518585205078125, 1.6072998046875, 1.696014404296875, 1.78472900390625, 1.873443603515625, 1.962158203125, 2.050872802734375, 2.13958740234375, 2.228302001953125, 2.3170166015625, 2.405731201171875, 2.49444580078125, 2.583160400390625, 2.671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 9.0, 16.0, 18.0, 24.0, 43.0, 50.0, 54.0, 64.0, 96.0, 114.0, 200.0, 285.0, 369.0, 560.0, 866.0, 1526.0, 3475.0, 11150.0, 57387.0, 651509.0, 267821.0, 37971.0, 8329.0, 2758.0, 1346.0, 752.0, 481.0, 345.0, 239.0, 182.0, 117.0, 94.0, 71.0, 60.0, 35.0, 30.0, 29.0, 18.0, 13.0, 8.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-6.11328125, -5.93804931640625, -5.7628173828125, -5.58758544921875, -5.412353515625, -5.23712158203125, -5.0618896484375, -4.88665771484375, -4.71142578125, -4.53619384765625, -4.3609619140625, -4.18572998046875, -4.010498046875, -3.83526611328125, -3.6600341796875, -3.48480224609375, -3.3095703125, -3.13433837890625, -2.9591064453125, -2.78387451171875, -2.608642578125, -2.43341064453125, -2.2581787109375, -2.08294677734375, -1.90771484375, -1.73248291015625, -1.5572509765625, -1.38201904296875, -1.206787109375, -1.03155517578125, -0.8563232421875, -0.68109130859375, -0.505859375, -0.33062744140625, -0.1553955078125, 0.01983642578125, 0.195068359375, 0.37030029296875, 0.5455322265625, 0.72076416015625, 0.89599609375, 1.07122802734375, 1.2464599609375, 1.42169189453125, 1.596923828125, 1.77215576171875, 1.9473876953125, 2.12261962890625, 2.2978515625, 2.47308349609375, 2.6483154296875, 2.82354736328125, 2.998779296875, 3.17401123046875, 3.3492431640625, 3.52447509765625, 3.69970703125, 3.87493896484375, 4.0501708984375, 4.22540283203125, 4.400634765625, 4.57586669921875, 4.7510986328125, 4.92633056640625, 5.1015625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 4.0, 14.0, 10.0, 15.0, 22.0, 27.0, 23.0, 32.0, 29.0, 45.0, 46.0, 61.0, 61.0, 67.0, 60.0, 69.0, 61.0, 60.0, 59.0, 35.0, 34.0, 31.0, 22.0, 17.0, 19.0, 13.0, 10.0, 14.0, 5.0, 4.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.078857421875, -8.79052734375, -8.502197265625, -8.2138671875, -7.925537109375, -7.63720703125, -7.348876953125, -7.060546875, -6.772216796875, -6.48388671875, -6.195556640625, -5.9072265625, -5.618896484375, -5.33056640625, -5.042236328125, -4.75390625, -4.465576171875, -4.17724609375, -3.888916015625, -3.6005859375, -3.312255859375, -3.02392578125, -2.735595703125, -2.447265625, -2.158935546875, -1.87060546875, -1.582275390625, -1.2939453125, -1.005615234375, -0.71728515625, -0.428955078125, -0.140625, 0.147705078125, 0.43603515625, 0.724365234375, 1.0126953125, 1.301025390625, 1.58935546875, 1.877685546875, 2.166015625, 2.454345703125, 2.74267578125, 3.031005859375, 3.3193359375, 3.607666015625, 3.89599609375, 4.184326171875, 4.47265625, 4.760986328125, 5.04931640625, 5.337646484375, 5.6259765625, 5.914306640625, 6.20263671875, 6.490966796875, 6.779296875, 7.067626953125, 7.35595703125, 7.644287109375, 7.9326171875, 8.220947265625, 8.50927734375, 8.797607421875, 9.0859375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 9.0, 7.0, 13.0, 12.0, 15.0, 26.0, 35.0, 62.0, 110.0, 216.0, 493.0, 1289.0, 3971.0, 16528.0, 116361.0, 801208.0, 89085.0, 13638.0, 3428.0, 1110.0, 439.0, 187.0, 114.0, 72.0, 25.0, 25.0, 16.0, 11.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.833984375, -1.7774505615234375, -1.720916748046875, -1.6643829345703125, -1.60784912109375, -1.5513153076171875, -1.494781494140625, -1.4382476806640625, -1.3817138671875, -1.3251800537109375, -1.268646240234375, -1.2121124267578125, -1.15557861328125, -1.0990447998046875, -1.042510986328125, -0.9859771728515625, -0.929443359375, -0.8729095458984375, -0.816375732421875, -0.7598419189453125, -0.70330810546875, -0.6467742919921875, -0.590240478515625, -0.5337066650390625, -0.4771728515625, -0.4206390380859375, -0.364105224609375, -0.3075714111328125, -0.25103759765625, -0.1945037841796875, -0.137969970703125, -0.0814361572265625, -0.02490234375, 0.0316314697265625, 0.088165283203125, 0.1446990966796875, 0.20123291015625, 0.2577667236328125, 0.314300537109375, 0.3708343505859375, 0.4273681640625, 0.4839019775390625, 0.540435791015625, 0.5969696044921875, 0.65350341796875, 0.7100372314453125, 0.766571044921875, 0.8231048583984375, 0.879638671875, 0.9361724853515625, 0.992706298828125, 1.0492401123046875, 1.10577392578125, 1.1623077392578125, 1.218841552734375, 1.2753753662109375, 1.3319091796875, 1.3884429931640625, 1.444976806640625, 1.5015106201171875, 1.55804443359375, 1.6145782470703125, 1.671112060546875, 1.7276458740234375, 1.7841796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 8.0, 10.0, 6.0, 6.0, 10.0, 21.0, 18.0, 30.0, 42.0, 65.0, 65.0, 92.0, 99.0, 109.0, 92.0, 60.0, 70.0, 59.0, 40.0, 27.0, 19.0, 11.0, 8.0, 9.0, 6.0, 6.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004982948303222656, -0.000482410192489624, -0.0004665255546569824, -0.0004506409168243408, -0.0004347562789916992, -0.0004188716411590576, -0.000402987003326416, -0.0003871023654937744, -0.0003712177276611328, -0.0003553330898284912, -0.0003394484519958496, -0.000323563814163208, -0.0003076791763305664, -0.0002917945384979248, -0.0002759099006652832, -0.0002600252628326416, -0.000244140625, -0.0002282559871673584, -0.0002123713493347168, -0.0001964867115020752, -0.0001806020736694336, -0.000164717435836792, -0.0001488327980041504, -0.0001329481601715088, -0.00011706352233886719, -0.00010117888450622559, -8.529424667358398e-05, -6.940960884094238e-05, -5.352497100830078e-05, -3.764033317565918e-05, -2.1755695343017578e-05, -5.8710575103759766e-06, 1.0013580322265625e-05, 2.5898218154907227e-05, 4.178285598754883e-05, 5.766749382019043e-05, 7.355213165283203e-05, 8.943676948547363e-05, 0.00010532140731811523, 0.00012120604515075684, 0.00013709068298339844, 0.00015297532081604004, 0.00016885995864868164, 0.00018474459648132324, 0.00020062923431396484, 0.00021651387214660645, 0.00023239850997924805, 0.00024828314781188965, 0.00026416778564453125, 0.00028005242347717285, 0.00029593706130981445, 0.00031182169914245605, 0.00032770633697509766, 0.00034359097480773926, 0.00035947561264038086, 0.00037536025047302246, 0.00039124488830566406, 0.00040712952613830566, 0.00042301416397094727, 0.00043889880180358887, 0.00045478343963623047, 0.00047066807746887207, 0.00048655271530151367, 0.0005024373531341553, 0.0005183219909667969]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 10.0, 17.0, 18.0, 21.0, 38.0, 60.0, 82.0, 174.0, 301.0, 566.0, 1249.0, 3301.0, 12821.0, 81895.0, 769105.0, 150831.0, 20115.0, 4817.0, 1543.0, 718.0, 346.0, 192.0, 114.0, 54.0, 52.0, 28.0, 18.0, 12.0, 12.0, 8.0, 10.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.703125, -1.652496337890625, -1.60186767578125, -1.551239013671875, -1.5006103515625, -1.449981689453125, -1.39935302734375, -1.348724365234375, -1.298095703125, -1.247467041015625, -1.19683837890625, -1.146209716796875, -1.0955810546875, -1.044952392578125, -0.99432373046875, -0.943695068359375, -0.89306640625, -0.842437744140625, -0.79180908203125, -0.741180419921875, -0.6905517578125, -0.639923095703125, -0.58929443359375, -0.538665771484375, -0.488037109375, -0.437408447265625, -0.38677978515625, -0.336151123046875, -0.2855224609375, -0.234893798828125, -0.18426513671875, -0.133636474609375, -0.0830078125, -0.032379150390625, 0.01824951171875, 0.068878173828125, 0.1195068359375, 0.170135498046875, 0.22076416015625, 0.271392822265625, 0.322021484375, 0.372650146484375, 0.42327880859375, 0.473907470703125, 0.5245361328125, 0.575164794921875, 0.62579345703125, 0.676422119140625, 0.72705078125, 0.777679443359375, 0.82830810546875, 0.878936767578125, 0.9295654296875, 0.980194091796875, 1.03082275390625, 1.081451416015625, 1.132080078125, 1.182708740234375, 1.23333740234375, 1.283966064453125, 1.3345947265625, 1.385223388671875, 1.43585205078125, 1.486480712890625, 1.537109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 8.0, 10.0, 9.0, 19.0, 29.0, 19.0, 37.0, 44.0, 52.0, 50.0, 77.0, 105.0, 96.0, 74.0, 62.0, 68.0, 44.0, 36.0, 19.0, 24.0, 16.0, 14.0, 19.0, 12.0, 7.0, 5.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1728515625, -1.13238525390625, -1.0919189453125, -1.05145263671875, -1.010986328125, -0.97052001953125, -0.9300537109375, -0.88958740234375, -0.84912109375, -0.80865478515625, -0.7681884765625, -0.72772216796875, -0.687255859375, -0.64678955078125, -0.6063232421875, -0.56585693359375, -0.525390625, -0.48492431640625, -0.4444580078125, -0.40399169921875, -0.363525390625, -0.32305908203125, -0.2825927734375, -0.24212646484375, -0.20166015625, -0.16119384765625, -0.1207275390625, -0.08026123046875, -0.039794921875, 0.00067138671875, 0.0411376953125, 0.08160400390625, 0.1220703125, 0.16253662109375, 0.2030029296875, 0.24346923828125, 0.283935546875, 0.32440185546875, 0.3648681640625, 0.40533447265625, 0.44580078125, 0.48626708984375, 0.5267333984375, 0.56719970703125, 0.607666015625, 0.64813232421875, 0.6885986328125, 0.72906494140625, 0.76953125, 0.80999755859375, 0.8504638671875, 0.89093017578125, 0.931396484375, 0.97186279296875, 1.0123291015625, 1.05279541015625, 1.09326171875, 1.13372802734375, 1.1741943359375, 1.21466064453125, 1.255126953125, 1.29559326171875, 1.3360595703125, 1.37652587890625, 1.4169921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 21.0, 45.0, 107.0, 384.0, 278.0, 101.0, 37.0, 15.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.36686706542969, -84.25753021240234, -82.148193359375, -80.03885650634766, -77.92951965332031, -75.82018280029297, -73.71084594726562, -71.60150146484375, -69.49217224121094, -67.3828353881836, -65.27349853515625, -63.164161682128906, -61.05482482910156, -58.94548797607422, -56.83614730834961, -54.726810455322266, -52.617469787597656, -50.50813293457031, -48.39879608154297, -46.289459228515625, -44.18012237548828, -42.07078552246094, -39.96144485473633, -37.852108001708984, -35.74277114868164, -33.6334342956543, -31.524097442626953, -29.414758682250977, -27.305421829223633, -25.19608497619629, -23.086746215820312, -20.97740936279297, -18.868072509765625, -16.75873565673828, -14.649397850036621, -12.540060043334961, -10.430723190307617, -8.321386337280273, -6.212048530578613, -4.102710723876953, -1.9933738708496094, 0.11596345901489258, 2.2253007888793945, 4.3346381187438965, 6.443975448608398, 8.553312301635742, 10.662650108337402, 12.771987915039062, 14.881324768066406, 16.99066162109375, 19.099998474121094, 21.20933723449707, 23.318674087524414, 25.428010940551758, 27.537349700927734, 29.646686553955078, 31.756023406982422, 33.865360260009766, 35.97469711303711, 38.08403396606445, 40.19337463378906, 42.302711486816406, 44.41204833984375, 46.521385192871094, 48.63072204589844]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 11.0, 15.0, 9.0, 7.0, 14.0, 15.0, 21.0, 25.0, 24.0, 31.0, 28.0, 41.0, 45.0, 55.0, 131.0, 157.0, 65.0, 32.0, 35.0, 33.0, 33.0, 17.0, 27.0, 24.0, 14.0, 13.0, 12.0, 12.0, 10.0, 9.0, 6.0, 2.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.65927505493164, -32.641571044921875, -31.623870849609375, -30.606168746948242, -29.58846664428711, -28.570762634277344, -27.55306053161621, -26.535358428955078, -25.517656326293945, -24.499954223632812, -23.48225212097168, -22.464550018310547, -21.44684600830078, -20.42914581298828, -19.411441802978516, -18.393739700317383, -17.37603759765625, -16.358335494995117, -15.340633392333984, -14.322930335998535, -13.305228233337402, -12.28752613067627, -11.26982307434082, -10.252120971679688, -9.234418869018555, -8.216716766357422, -7.199014186859131, -6.18131160736084, -5.163609504699707, -4.145907402038574, -3.128204822540283, -2.110502243041992, -1.0927982330322266, -0.07509589195251465, 0.9426064491271973, 1.9603087902069092, 2.978011131286621, 3.995713233947754, 5.013415813446045, 6.031118392944336, 7.048820495605469, 8.066522598266602, 9.084224700927734, 10.101927757263184, 11.119629859924316, 12.13733196258545, 13.155035018920898, 14.172737121582031, 15.190439224243164, 16.208141326904297, 17.22584342956543, 18.243545532226562, 19.261249542236328, 20.278949737548828, 21.296653747558594, 22.314355850219727, 23.33205795288086, 24.349760055541992, 25.367462158203125, 26.385164260864258, 27.40286636352539, 28.420570373535156, 29.43827247619629, 30.455974578857422, 31.473676681518555]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 9.0, 11.0, 14.0, 14.0, 20.0, 34.0, 46.0, 55.0, 76.0, 119.0, 171.0, 207.0, 331.0, 501.0, 704.0, 1175.0, 1766.0, 3249.0, 6118.0, 12939.0, 30286.0, 84066.0, 246068.0, 640854.0, 1218764.0, 1101075.0, 525050.0, 198834.0, 70403.0, 26405.0, 11622.0, 5553.0, 2816.0, 1728.0, 1107.0, 672.0, 455.0, 283.0, 206.0, 137.0, 84.0, 75.0, 33.0, 40.0, 31.0, 15.0, 17.0, 14.0, 10.0, 3.0, 10.0, 5.0, 2.0, 3.0], "bins": [-2.099609375, -2.0394439697265625, -1.979278564453125, -1.9191131591796875, -1.85894775390625, -1.7987823486328125, -1.738616943359375, -1.6784515380859375, -1.6182861328125, -1.5581207275390625, -1.497955322265625, -1.4377899169921875, -1.37762451171875, -1.3174591064453125, -1.257293701171875, -1.1971282958984375, -1.136962890625, -1.0767974853515625, -1.016632080078125, -0.9564666748046875, -0.89630126953125, -0.8361358642578125, -0.775970458984375, -0.7158050537109375, -0.6556396484375, -0.5954742431640625, -0.535308837890625, -0.4751434326171875, -0.41497802734375, -0.3548126220703125, -0.294647216796875, -0.2344818115234375, -0.17431640625, -0.1141510009765625, -0.053985595703125, 0.0061798095703125, 0.06634521484375, 0.1265106201171875, 0.186676025390625, 0.2468414306640625, 0.3070068359375, 0.3671722412109375, 0.427337646484375, 0.4875030517578125, 0.54766845703125, 0.6078338623046875, 0.667999267578125, 0.7281646728515625, 0.788330078125, 0.8484954833984375, 0.908660888671875, 0.9688262939453125, 1.02899169921875, 1.0891571044921875, 1.149322509765625, 1.2094879150390625, 1.2696533203125, 1.3298187255859375, 1.389984130859375, 1.4501495361328125, 1.51031494140625, 1.5704803466796875, 1.630645751953125, 1.6908111572265625, 1.7509765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 11.0, 9.0, 7.0, 14.0, 11.0, 20.0, 15.0, 28.0, 31.0, 37.0, 41.0, 46.0, 46.0, 59.0, 53.0, 39.0, 45.0, 58.0, 52.0, 48.0, 52.0, 41.0, 39.0, 33.0, 27.0, 20.0, 26.0, 19.0, 17.0, 15.0, 9.0, 7.0, 4.0, 4.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.6495208740234375, -2.580291748046875, -2.5110626220703125, -2.44183349609375, -2.3726043701171875, -2.303375244140625, -2.2341461181640625, -2.1649169921875, -2.0956878662109375, -2.026458740234375, -1.9572296142578125, -1.88800048828125, -1.8187713623046875, -1.749542236328125, -1.6803131103515625, -1.611083984375, -1.5418548583984375, -1.472625732421875, -1.4033966064453125, -1.33416748046875, -1.2649383544921875, -1.195709228515625, -1.1264801025390625, -1.0572509765625, -0.9880218505859375, -0.918792724609375, -0.8495635986328125, -0.78033447265625, -0.7111053466796875, -0.641876220703125, -0.5726470947265625, -0.50341796875, -0.4341888427734375, -0.364959716796875, -0.2957305908203125, -0.22650146484375, -0.1572723388671875, -0.088043212890625, -0.0188140869140625, 0.0504150390625, 0.1196441650390625, 0.188873291015625, 0.2581024169921875, 0.32733154296875, 0.3965606689453125, 0.465789794921875, 0.5350189208984375, 0.604248046875, 0.6734771728515625, 0.742706298828125, 0.8119354248046875, 0.88116455078125, 0.9503936767578125, 1.019622802734375, 1.0888519287109375, 1.1580810546875, 1.2273101806640625, 1.296539306640625, 1.3657684326171875, 1.43499755859375, 1.5042266845703125, 1.573455810546875, 1.6426849365234375, 1.7119140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 9.0, 15.0, 21.0, 37.0, 55.0, 129.0, 182.0, 438.0, 965.0, 2824.0, 18566.0, 3732975.0, 427862.0, 7130.0, 1668.0, 729.0, 325.0, 147.0, 78.0, 56.0, 29.0, 14.0, 10.0, 11.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8515625, -11.425537109375, -10.99951171875, -10.573486328125, -10.1474609375, -9.721435546875, -9.29541015625, -8.869384765625, -8.443359375, -8.017333984375, -7.59130859375, -7.165283203125, -6.7392578125, -6.313232421875, -5.88720703125, -5.461181640625, -5.03515625, -4.609130859375, -4.18310546875, -3.757080078125, -3.3310546875, -2.905029296875, -2.47900390625, -2.052978515625, -1.626953125, -1.200927734375, -0.77490234375, -0.348876953125, 0.0771484375, 0.503173828125, 0.92919921875, 1.355224609375, 1.78125, 2.207275390625, 2.63330078125, 3.059326171875, 3.4853515625, 3.911376953125, 4.33740234375, 4.763427734375, 5.189453125, 5.615478515625, 6.04150390625, 6.467529296875, 6.8935546875, 7.319580078125, 7.74560546875, 8.171630859375, 8.59765625, 9.023681640625, 9.44970703125, 9.875732421875, 10.3017578125, 10.727783203125, 11.15380859375, 11.579833984375, 12.005859375, 12.431884765625, 12.85791015625, 13.283935546875, 13.7099609375, 14.135986328125, 14.56201171875, 14.988037109375, 15.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 8.0, 5.0, 13.0, 28.0, 32.0, 55.0, 83.0, 121.0, 175.0, 265.0, 366.0, 470.0, 567.0, 545.0, 439.0, 289.0, 204.0, 124.0, 91.0, 63.0, 41.0, 37.0, 17.0, 9.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.43145751953125, -4.2183837890625, -4.00531005859375, -3.792236328125, -3.57916259765625, -3.3660888671875, -3.15301513671875, -2.93994140625, -2.72686767578125, -2.5137939453125, -2.30072021484375, -2.087646484375, -1.87457275390625, -1.6614990234375, -1.44842529296875, -1.2353515625, -1.02227783203125, -0.8092041015625, -0.59613037109375, -0.383056640625, -0.16998291015625, 0.0430908203125, 0.25616455078125, 0.46923828125, 0.68231201171875, 0.8953857421875, 1.10845947265625, 1.321533203125, 1.53460693359375, 1.7476806640625, 1.96075439453125, 2.173828125, 2.38690185546875, 2.5999755859375, 2.81304931640625, 3.026123046875, 3.23919677734375, 3.4522705078125, 3.66534423828125, 3.87841796875, 4.09149169921875, 4.3045654296875, 4.51763916015625, 4.730712890625, 4.94378662109375, 5.1568603515625, 5.36993408203125, 5.5830078125, 5.79608154296875, 6.0091552734375, 6.22222900390625, 6.435302734375, 6.64837646484375, 6.8614501953125, 7.07452392578125, 7.28759765625, 7.50067138671875, 7.7137451171875, 7.92681884765625, 8.139892578125, 8.35296630859375, 8.5660400390625, 8.77911376953125, 8.9921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 9.0, 8.0, 24.0, 49.0, 145.0, 288.0, 266.0, 112.0, 53.0, 20.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-164.75033569335938, -161.0089111328125, -157.26747131347656, -153.5260467529297, -149.78460693359375, -146.04318237304688, -142.3017578125, -138.56031799316406, -134.8188934326172, -131.0774688720703, -127.33602905273438, -123.5946044921875, -119.8531723022461, -116.11174011230469, -112.37030792236328, -108.62887573242188, -104.88744354248047, -101.14601135253906, -97.40457916259766, -93.66314697265625, -89.92172241210938, -86.18029022216797, -82.43885803222656, -78.69742584228516, -74.95599365234375, -71.21456146240234, -67.47312927246094, -63.7317008972168, -59.990272521972656, -56.24884033203125, -52.507408142089844, -48.76597595214844, -45.02455139160156, -41.283119201660156, -37.541690826416016, -33.80025863647461, -30.058828353881836, -26.317398071289062, -22.575965881347656, -18.834535598754883, -15.09310531616211, -11.351675033569336, -7.610243797302246, -3.8688125610351562, -0.1273822784423828, 3.6140480041503906, 7.355480194091797, 11.09691047668457, 14.838340759277344, 18.579771041870117, 22.32120132446289, 26.062633514404297, 29.80406379699707, 33.545494079589844, 37.28692626953125, 41.028358459472656, 44.7697868347168, 48.5112190246582, 52.252647399902344, 55.99407958984375, 59.735511779785156, 63.4769401550293, 67.21836853027344, 70.95980072021484, 74.70123291015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 10.0, 10.0, 11.0, 20.0, 26.0, 27.0, 33.0, 34.0, 40.0, 39.0, 40.0, 51.0, 51.0, 68.0, 61.0, 44.0, 45.0, 46.0, 54.0, 34.0, 33.0, 29.0, 32.0, 29.0, 19.0, 19.0, 13.0, 22.0, 11.0, 10.0, 5.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.44635772705078, -32.323265075683594, -31.200172424316406, -30.07707977294922, -28.95398712158203, -27.830894470214844, -26.70780372619629, -25.5847110748291, -24.461618423461914, -23.338525772094727, -22.21543312072754, -21.09234046936035, -19.969249725341797, -18.84615707397461, -17.723064422607422, -16.599971771240234, -15.476879119873047, -14.35378646850586, -13.230693817138672, -12.1076021194458, -10.984509468078613, -9.861416816711426, -8.738325119018555, -7.615232467651367, -6.49213981628418, -5.369047164916992, -4.245954990386963, -3.1228625774383545, -1.999770164489746, -0.8766775131225586, 0.2464146614074707, 1.3695068359375, 2.4925994873046875, 3.615691900253296, 4.738784313201904, 5.861876487731934, 6.984969139099121, 8.108061790466309, 9.23115348815918, 10.354246139526367, 11.477338790893555, 12.600431442260742, 13.72352409362793, 14.8466157913208, 15.969708442687988, 17.09280014038086, 18.215892791748047, 19.338985443115234, 20.462078094482422, 21.58517074584961, 22.708263397216797, 23.831356048583984, 24.954448699951172, 26.07754135131836, 27.200632095336914, 28.3237247467041, 29.44681739807129, 30.569910049438477, 31.693002700805664, 32.81609344482422, 33.939186096191406, 35.062278747558594, 36.18537139892578, 37.30846405029297, 38.431556701660156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 14.0, 16.0, 14.0, 18.0, 35.0, 45.0, 77.0, 115.0, 179.0, 295.0, 638.0, 1190.0, 2313.0, 5169.0, 13390.0, 39746.0, 150191.0, 593470.0, 172259.0, 43957.0, 14446.0, 5642.0, 2535.0, 1238.0, 675.0, 345.0, 217.0, 111.0, 73.0, 44.0, 31.0, 14.0, 13.0, 12.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.30145263671875, -4.1732177734375, -4.04498291015625, -3.916748046875, -3.78851318359375, -3.6602783203125, -3.53204345703125, -3.40380859375, -3.27557373046875, -3.1473388671875, -3.01910400390625, -2.890869140625, -2.76263427734375, -2.6343994140625, -2.50616455078125, -2.3779296875, -2.24969482421875, -2.1214599609375, -1.99322509765625, -1.864990234375, -1.73675537109375, -1.6085205078125, -1.48028564453125, -1.35205078125, -1.22381591796875, -1.0955810546875, -0.96734619140625, -0.839111328125, -0.71087646484375, -0.5826416015625, -0.45440673828125, -0.326171875, -0.19793701171875, -0.0697021484375, 0.05853271484375, 0.186767578125, 0.31500244140625, 0.4432373046875, 0.57147216796875, 0.69970703125, 0.82794189453125, 0.9561767578125, 1.08441162109375, 1.212646484375, 1.34088134765625, 1.4691162109375, 1.59735107421875, 1.7255859375, 1.85382080078125, 1.9820556640625, 2.11029052734375, 2.238525390625, 2.36676025390625, 2.4949951171875, 2.62322998046875, 2.75146484375, 2.87969970703125, 3.0079345703125, 3.13616943359375, 3.264404296875, 3.39263916015625, 3.5208740234375, 3.64910888671875, 3.77734375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 13.0, 21.0, 21.0, 16.0, 40.0, 39.0, 67.0, 50.0, 65.0, 77.0, 85.0, 67.0, 77.0, 76.0, 53.0, 57.0, 43.0, 35.0, 19.0, 29.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.35174560546875, -3.2366943359375, -3.12164306640625, -3.006591796875, -2.89154052734375, -2.7764892578125, -2.66143798828125, -2.54638671875, -2.43133544921875, -2.3162841796875, -2.20123291015625, -2.086181640625, -1.97113037109375, -1.8560791015625, -1.74102783203125, -1.6259765625, -1.51092529296875, -1.3958740234375, -1.28082275390625, -1.165771484375, -1.05072021484375, -0.9356689453125, -0.82061767578125, -0.70556640625, -0.59051513671875, -0.4754638671875, -0.36041259765625, -0.245361328125, -0.13031005859375, -0.0152587890625, 0.09979248046875, 0.21484375, 0.32989501953125, 0.4449462890625, 0.55999755859375, 0.675048828125, 0.79010009765625, 0.9051513671875, 1.02020263671875, 1.13525390625, 1.25030517578125, 1.3653564453125, 1.48040771484375, 1.595458984375, 1.71051025390625, 1.8255615234375, 1.94061279296875, 2.0556640625, 2.17071533203125, 2.2857666015625, 2.40081787109375, 2.515869140625, 2.63092041015625, 2.7459716796875, 2.86102294921875, 2.97607421875, 3.09112548828125, 3.2061767578125, 3.32122802734375, 3.436279296875, 3.55133056640625, 3.6663818359375, 3.78143310546875, 3.896484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 6.0, 11.0, 20.0, 30.0, 26.0, 45.0, 70.0, 90.0, 126.0, 221.0, 392.0, 858.0, 2014.0, 7679.0, 56057.0, 899784.0, 68423.0, 8768.0, 2168.0, 812.0, 382.0, 212.0, 120.0, 58.0, 55.0, 32.0, 23.0, 13.0, 9.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.30078125, -6.10101318359375, -5.9012451171875, -5.70147705078125, -5.501708984375, -5.30194091796875, -5.1021728515625, -4.90240478515625, -4.70263671875, -4.50286865234375, -4.3031005859375, -4.10333251953125, -3.903564453125, -3.70379638671875, -3.5040283203125, -3.30426025390625, -3.1044921875, -2.90472412109375, -2.7049560546875, -2.50518798828125, -2.305419921875, -2.10565185546875, -1.9058837890625, -1.70611572265625, -1.50634765625, -1.30657958984375, -1.1068115234375, -0.90704345703125, -0.707275390625, -0.50750732421875, -0.3077392578125, -0.10797119140625, 0.091796875, 0.29156494140625, 0.4913330078125, 0.69110107421875, 0.890869140625, 1.09063720703125, 1.2904052734375, 1.49017333984375, 1.68994140625, 1.88970947265625, 2.0894775390625, 2.28924560546875, 2.489013671875, 2.68878173828125, 2.8885498046875, 3.08831787109375, 3.2880859375, 3.48785400390625, 3.6876220703125, 3.88739013671875, 4.087158203125, 4.28692626953125, 4.4866943359375, 4.68646240234375, 4.88623046875, 5.08599853515625, 5.2857666015625, 5.48553466796875, 5.685302734375, 5.88507080078125, 6.0848388671875, 6.28460693359375, 6.484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 4.0, 7.0, 4.0, 14.0, 2.0, 12.0, 9.0, 16.0, 15.0, 18.0, 29.0, 18.0, 27.0, 26.0, 39.0, 51.0, 52.0, 61.0, 74.0, 77.0, 64.0, 65.0, 53.0, 50.0, 37.0, 35.0, 23.0, 20.0, 10.0, 14.0, 9.0, 12.0, 7.0, 5.0, 7.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.8828125, -8.591064453125, -8.29931640625, -8.007568359375, -7.7158203125, -7.424072265625, -7.13232421875, -6.840576171875, -6.548828125, -6.257080078125, -5.96533203125, -5.673583984375, -5.3818359375, -5.090087890625, -4.79833984375, -4.506591796875, -4.21484375, -3.923095703125, -3.63134765625, -3.339599609375, -3.0478515625, -2.756103515625, -2.46435546875, -2.172607421875, -1.880859375, -1.589111328125, -1.29736328125, -1.005615234375, -0.7138671875, -0.422119140625, -0.13037109375, 0.161376953125, 0.453125, 0.744873046875, 1.03662109375, 1.328369140625, 1.6201171875, 1.911865234375, 2.20361328125, 2.495361328125, 2.787109375, 3.078857421875, 3.37060546875, 3.662353515625, 3.9541015625, 4.245849609375, 4.53759765625, 4.829345703125, 5.12109375, 5.412841796875, 5.70458984375, 5.996337890625, 6.2880859375, 6.579833984375, 6.87158203125, 7.163330078125, 7.455078125, 7.746826171875, 8.03857421875, 8.330322265625, 8.6220703125, 8.913818359375, 9.20556640625, 9.497314453125, 9.7890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 12.0, 16.0, 24.0, 31.0, 44.0, 53.0, 78.0, 126.0, 172.0, 293.0, 507.0, 1004.0, 2065.0, 4888.0, 13962.0, 52763.0, 816453.0, 119711.0, 22745.0, 7507.0, 2954.0, 1369.0, 690.0, 386.0, 214.0, 151.0, 88.0, 69.0, 45.0, 28.0, 26.0, 19.0, 6.0, 11.0, 5.0, 6.0, 7.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.001953125, -0.97222900390625, -0.9425048828125, -0.91278076171875, -0.883056640625, -0.85333251953125, -0.8236083984375, -0.79388427734375, -0.76416015625, -0.73443603515625, -0.7047119140625, -0.67498779296875, -0.645263671875, -0.61553955078125, -0.5858154296875, -0.55609130859375, -0.5263671875, -0.49664306640625, -0.4669189453125, -0.43719482421875, -0.407470703125, -0.37774658203125, -0.3480224609375, -0.31829833984375, -0.28857421875, -0.25885009765625, -0.2291259765625, -0.19940185546875, -0.169677734375, -0.13995361328125, -0.1102294921875, -0.08050537109375, -0.05078125, -0.02105712890625, 0.0086669921875, 0.03839111328125, 0.068115234375, 0.09783935546875, 0.1275634765625, 0.15728759765625, 0.18701171875, 0.21673583984375, 0.2464599609375, 0.27618408203125, 0.305908203125, 0.33563232421875, 0.3653564453125, 0.39508056640625, 0.4248046875, 0.45452880859375, 0.4842529296875, 0.51397705078125, 0.543701171875, 0.57342529296875, 0.6031494140625, 0.63287353515625, 0.66259765625, 0.69232177734375, 0.7220458984375, 0.75177001953125, 0.781494140625, 0.81121826171875, 0.8409423828125, 0.87066650390625, 0.900390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 15.0, 17.0, 29.0, 26.0, 34.0, 38.0, 61.0, 91.0, 133.0, 122.0, 109.0, 71.0, 55.0, 41.0, 33.0, 21.0, 20.0, 11.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005426406860351562, -0.0005280636250972748, -0.0005134865641593933, -0.0004989095032215118, -0.00048433244228363037, -0.0004697553813457489, -0.00045517832040786743, -0.00044060125946998596, -0.0004260241985321045, -0.000411447137594223, -0.00039687007665634155, -0.0003822930157184601, -0.0003677159547805786, -0.00035313889384269714, -0.0003385618329048157, -0.0003239847719669342, -0.00030940771102905273, -0.00029483065009117126, -0.0002802535891532898, -0.0002656765282154083, -0.00025109946727752686, -0.00023652240633964539, -0.00022194534540176392, -0.00020736828446388245, -0.00019279122352600098, -0.0001782141625881195, -0.00016363710165023804, -0.00014906004071235657, -0.0001344829797744751, -0.00011990591883659363, -0.00010532885789871216, -9.075179696083069e-05, -7.617473602294922e-05, -6.159767508506775e-05, -4.702061414718628e-05, -3.244355320930481e-05, -1.786649227142334e-05, -3.28943133354187e-06, 1.12876296043396e-05, 2.586469054222107e-05, 4.044175148010254e-05, 5.501881241798401e-05, 6.959587335586548e-05, 8.417293429374695e-05, 9.874999523162842e-05, 0.00011332705616950989, 0.00012790411710739136, 0.00014248117804527283, 0.0001570582389831543, 0.00017163529992103577, 0.00018621236085891724, 0.0002007894217967987, 0.00021536648273468018, 0.00022994354367256165, 0.0002445206046104431, 0.0002590976655483246, 0.00027367472648620605, 0.0002882517874240875, 0.000302828848361969, 0.00031740590929985046, 0.00033198297023773193, 0.0003465600311756134, 0.0003611370921134949, 0.00037571415305137634, 0.0003902912139892578]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 10.0, 4.0, 11.0, 15.0, 18.0, 26.0, 21.0, 58.0, 84.0, 109.0, 169.0, 264.0, 448.0, 714.0, 1296.0, 2518.0, 5460.0, 12868.0, 36071.0, 161801.0, 732239.0, 60105.0, 19017.0, 7596.0, 3470.0, 1772.0, 949.0, 543.0, 303.0, 183.0, 127.0, 90.0, 50.0, 49.0, 30.0, 22.0, 18.0, 5.0, 9.0, 6.0, 8.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.78955078125, -0.7683258056640625, -0.747100830078125, -0.7258758544921875, -0.70465087890625, -0.6834259033203125, -0.662200927734375, -0.6409759521484375, -0.6197509765625, -0.5985260009765625, -0.577301025390625, -0.5560760498046875, -0.53485107421875, -0.5136260986328125, -0.492401123046875, -0.4711761474609375, -0.449951171875, -0.4287261962890625, -0.407501220703125, -0.3862762451171875, -0.36505126953125, -0.3438262939453125, -0.322601318359375, -0.3013763427734375, -0.2801513671875, -0.2589263916015625, -0.237701416015625, -0.2164764404296875, -0.19525146484375, -0.1740264892578125, -0.152801513671875, -0.1315765380859375, -0.1103515625, -0.0891265869140625, -0.067901611328125, -0.0466766357421875, -0.02545166015625, -0.0042266845703125, 0.016998291015625, 0.0382232666015625, 0.0594482421875, 0.0806732177734375, 0.101898193359375, 0.1231231689453125, 0.14434814453125, 0.1655731201171875, 0.186798095703125, 0.2080230712890625, 0.229248046875, 0.2504730224609375, 0.271697998046875, 0.2929229736328125, 0.31414794921875, 0.3353729248046875, 0.356597900390625, 0.3778228759765625, 0.3990478515625, 0.4202728271484375, 0.441497802734375, 0.4627227783203125, 0.48394775390625, 0.5051727294921875, 0.526397705078125, 0.5476226806640625, 0.56884765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 9.0, 8.0, 6.0, 9.0, 9.0, 14.0, 17.0, 25.0, 46.0, 51.0, 83.0, 91.0, 128.0, 142.0, 93.0, 71.0, 41.0, 24.0, 35.0, 20.0, 13.0, 11.0, 12.0, 12.0, 5.0, 6.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3447265625, -1.3036956787109375, -1.262664794921875, -1.2216339111328125, -1.18060302734375, -1.1395721435546875, -1.098541259765625, -1.0575103759765625, -1.0164794921875, -0.9754486083984375, -0.934417724609375, -0.8933868408203125, -0.85235595703125, -0.8113250732421875, -0.770294189453125, -0.7292633056640625, -0.688232421875, -0.6472015380859375, -0.606170654296875, -0.5651397705078125, -0.52410888671875, -0.4830780029296875, -0.442047119140625, -0.4010162353515625, -0.3599853515625, -0.3189544677734375, -0.277923583984375, -0.2368927001953125, -0.19586181640625, -0.1548309326171875, -0.113800048828125, -0.0727691650390625, -0.03173828125, 0.0092926025390625, 0.050323486328125, 0.0913543701171875, 0.13238525390625, 0.1734161376953125, 0.214447021484375, 0.2554779052734375, 0.2965087890625, 0.3375396728515625, 0.378570556640625, 0.4196014404296875, 0.46063232421875, 0.5016632080078125, 0.542694091796875, 0.5837249755859375, 0.624755859375, 0.6657867431640625, 0.706817626953125, 0.7478485107421875, 0.78887939453125, 0.8299102783203125, 0.870941162109375, 0.9119720458984375, 0.9530029296875, 0.9940338134765625, 1.035064697265625, 1.0760955810546875, 1.11712646484375, 1.1581573486328125, 1.199188232421875, 1.2402191162109375, 1.28125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 8.0, 9.0, 15.0, 23.0, 39.0, 54.0, 98.0, 498.0, 113.0, 61.0, 34.0, 16.0, 9.0, 3.0, 5.0, 2.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.201515197753906, -41.98759841918945, -40.773681640625, -39.55976867675781, -38.34585189819336, -37.131935119628906, -35.91801834106445, -34.7041015625, -33.49018859863281, -32.27627182006836, -31.06235694885254, -29.848440170288086, -28.634525299072266, -27.420608520507812, -26.20669174194336, -24.992774963378906, -23.778858184814453, -22.56494140625, -21.35102653503418, -20.137109756469727, -18.923194885253906, -17.709278106689453, -16.495361328125, -15.281445503234863, -14.067529678344727, -12.85361385345459, -11.639698028564453, -10.42578125, -9.211865425109863, -7.997949600219727, -6.784033298492432, -5.570116996765137, -4.356201171875, -3.142285108566284, -1.9283690452575684, -0.7144529819488525, 0.4994630813598633, 1.71337890625, 2.927295207977295, 4.14121150970459, 5.355127334594727, 6.569043159484863, 7.782959461212158, 8.996875762939453, 10.21079158782959, 11.424707412719727, 12.63862419128418, 13.852540016174316, 15.066455841064453, 16.280372619628906, 17.494287490844727, 18.70820426940918, 19.922119140625, 21.136035919189453, 22.349952697753906, 23.56386947631836, 24.77778434753418, 25.991701126098633, 27.205615997314453, 28.419532775878906, 29.63344955444336, 30.84736442565918, 32.061279296875, 33.27519607543945, 34.489112854003906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 13.0, 7.0, 6.0, 5.0, 10.0, 8.0, 11.0, 16.0, 20.0, 21.0, 21.0, 29.0, 24.0, 19.0, 30.0, 72.0, 258.0, 159.0, 42.0, 25.0, 28.0, 20.0, 22.0, 13.0, 17.0, 15.0, 12.0, 11.0, 10.0, 5.0, 9.0, 6.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.954437255859375, -21.240957260131836, -20.52747917175293, -19.81399917602539, -19.10051918029785, -18.387041091918945, -17.673561096191406, -16.9600830078125, -16.24660301208496, -15.533123970031738, -14.8196439743042, -14.106164932250977, -13.392685890197754, -12.679206848144531, -11.965726852416992, -11.25224781036377, -10.53876781463623, -9.825288772583008, -9.111808776855469, -8.398329734802246, -7.684850692749023, -6.971371173858643, -6.257891654968262, -5.544412612915039, -4.830933094024658, -4.117453575134277, -3.4039745330810547, -2.690495014190674, -1.977015733718872, -1.2635364532470703, -0.5500569343566895, 0.1634221076965332, 0.8769016265869141, 1.5903809070587158, 2.3038601875305176, 3.0173397064208984, 3.7308189868927, 4.444298267364502, 5.157777786254883, 5.8712568283081055, 6.584736347198486, 7.298215866088867, 8.01169490814209, 8.725173950195312, 9.438653945922852, 10.152132987976074, 10.865612030029297, 11.579092025756836, 12.292571067810059, 13.006050109863281, 13.71953010559082, 14.433009147644043, 15.146488189697266, 15.859968185424805, 16.573448181152344, 17.28692626953125, 18.00040626525879, 18.713886260986328, 19.427364349365234, 20.140844345092773, 20.854324340820312, 21.56780242919922, 22.281282424926758, 22.994762420654297, 23.708240509033203]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 16.0, 13.0, 15.0, 12.0, 26.0, 17.0, 23.0, 31.0, 34.0, 48.0, 132.0, 245.0, 88.0, 45.0, 36.0, 33.0, 29.0, 18.0, 25.0, 22.0, 12.0, 9.0, 10.0, 14.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.486328125, -2.407073974609375, -2.32781982421875, -2.248565673828125, -2.1693115234375, -2.090057373046875, -2.01080322265625, -1.931549072265625, -1.852294921875, -1.773040771484375, -1.69378662109375, -1.614532470703125, -1.5352783203125, -1.456024169921875, -1.37677001953125, -1.297515869140625, -1.21826171875, -1.139007568359375, -1.05975341796875, -0.980499267578125, -0.9012451171875, -0.821990966796875, -0.74273681640625, -0.663482666015625, -0.584228515625, -0.504974365234375, -0.42572021484375, -0.346466064453125, -0.2672119140625, -0.187957763671875, -0.10870361328125, -0.029449462890625, 0.0498046875, 0.129058837890625, 0.20831298828125, 0.287567138671875, 0.3668212890625, 0.446075439453125, 0.52532958984375, 0.604583740234375, 0.683837890625, 0.763092041015625, 0.84234619140625, 0.921600341796875, 1.0008544921875, 1.080108642578125, 1.15936279296875, 1.238616943359375, 1.31787109375, 1.397125244140625, 1.47637939453125, 1.555633544921875, 1.6348876953125, 1.714141845703125, 1.79339599609375, 1.872650146484375, 1.951904296875, 2.031158447265625, 2.11041259765625, 2.189666748046875, 2.2689208984375, 2.348175048828125, 2.42742919921875, 2.506683349609375, 2.5859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 2.0, 7.0, 13.0, 33.0, 24.0, 30.0, 58.0, 49.0, 113.0, 225.0, 635.0, 2216.0, 15102.0, 8354459.0, 12634.0, 1943.0, 519.0, 225.0, 104.0, 43.0, 21.0, 22.0, 20.0, 20.0, 7.0, 5.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0], "bins": [-29.67580223083496, -28.761919021606445, -27.84803581237793, -26.934152603149414, -26.0202693939209, -25.106386184692383, -24.192502975463867, -23.27861976623535, -22.364736557006836, -21.45085334777832, -20.536970138549805, -19.62308692932129, -18.709203720092773, -17.795320510864258, -16.881437301635742, -15.967554092407227, -15.053671836853027, -14.139788627624512, -13.225905418395996, -12.31202220916748, -11.398138999938965, -10.484256744384766, -9.57037353515625, -8.656490325927734, -7.7426066398620605, -6.828723430633545, -5.914840221405029, -5.000957489013672, -4.087074279785156, -3.1731910705566406, -2.259307861328125, -1.3454246520996094, -0.43154144287109375, 0.4823417067527771, 1.396224856376648, 2.310107946395874, 3.2239911556243896, 4.137874126434326, 5.051757335662842, 5.965640544891357, 6.879523754119873, 7.793406963348389, 8.707289695739746, 9.621172904968262, 10.535056114196777, 11.448939323425293, 12.362822532653809, 13.276705741882324, 14.19058895111084, 15.104472160339355, 16.018354415893555, 16.93223762512207, 17.846120834350586, 18.7600040435791, 19.673887252807617, 20.587770462036133, 21.50165367126465, 22.415536880493164, 23.32942008972168, 24.243303298950195, 25.15718650817871, 26.071069717407227, 26.984952926635742, 27.898836135864258, 28.812719345092773]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.674331665039062, -20.998470306396484, -20.322607040405273, -19.646745681762695, -18.970884323120117, -18.295021057128906, -17.619159698486328, -16.94329833984375, -16.267436981201172, -15.591574668884277, -14.9157133102417, -14.239850997924805, -13.563989639282227, -12.888127326965332, -12.212265014648438, -11.53640365600586, -10.860540390014648, -10.184678077697754, -9.508816719055176, -8.832954406738281, -8.157093048095703, -7.481230735778809, -6.805368423461914, -6.129506587982178, -5.453644752502441, -4.777782917022705, -4.101921081542969, -3.426058769226074, -2.750196933746338, -2.0743350982666016, -1.398472785949707, -0.7226109504699707, -0.04674720764160156, 0.6291147470474243, 1.3049767017364502, 1.9808387756347656, 2.656700611114502, 3.3325624465942383, 4.008424758911133, 4.684286594390869, 5.3601484298706055, 6.036010265350342, 6.711872100830078, 7.387734413146973, 8.063596725463867, 8.739458084106445, 9.41532039642334, 10.091182708740234, 10.767044067382812, 11.442906379699707, 12.118767738342285, 12.79463005065918, 13.470491409301758, 14.146353721618652, 14.822216033935547, 15.498077392578125, 16.173938751220703, 16.84980010986328, 17.525663375854492, 18.20152473449707, 18.87738609313965, 19.55324935913086, 20.229110717773438, 20.904972076416016, 21.580835342407227]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 5.0, 8.0, 11.0, 12.0, 8.0, 19.0, 37.0, 30.0, 39.0, 80.0, 96.0, 143.0, 216.0, 375.0, 767.0, 1754.0, 4839.0, 13939.0, 42735.0, 140101.0, 207724.0, 75123.0, 23374.0, 7757.0, 2671.0, 1080.0, 488.0, 265.0, 165.0, 114.0, 76.0, 50.0, 38.0, 26.0, 29.0, 19.0, 8.0, 15.0, 8.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.734375, -20.110595703125, -19.48681640625, -18.863037109375, -18.2392578125, -17.615478515625, -16.99169921875, -16.367919921875, -15.744140625, -15.120361328125, -14.49658203125, -13.872802734375, -13.2490234375, -12.625244140625, -12.00146484375, -11.377685546875, -10.75390625, -10.130126953125, -9.50634765625, -8.882568359375, -8.2587890625, -7.635009765625, -7.01123046875, -6.387451171875, -5.763671875, -5.139892578125, -4.51611328125, -3.892333984375, -3.2685546875, -2.644775390625, -2.02099609375, -1.397216796875, -0.7734375, -0.149658203125, 0.47412109375, 1.097900390625, 1.7216796875, 2.345458984375, 2.96923828125, 3.593017578125, 4.216796875, 4.840576171875, 5.46435546875, 6.088134765625, 6.7119140625, 7.335693359375, 7.95947265625, 8.583251953125, 9.20703125, 9.830810546875, 10.45458984375, 11.078369140625, 11.7021484375, 12.325927734375, 12.94970703125, 13.573486328125, 14.197265625, 14.821044921875, 15.44482421875, 16.068603515625, 16.6923828125, 17.316162109375, 17.93994140625, 18.563720703125, 19.1875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 7.0, 9.0, 23.0, 22.0, 22.0, 36.0, 56.0, 49.0, 79.0, 84.0, 103.0, 101.0, 90.0, 74.0, 67.0, 42.0, 35.0, 32.0, 16.0, 15.0, 8.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314453125, -3.196685791015625, -3.07891845703125, -2.961151123046875, -2.8433837890625, -2.725616455078125, -2.60784912109375, -2.490081787109375, -2.372314453125, -2.254547119140625, -2.13677978515625, -2.019012451171875, -1.9012451171875, -1.783477783203125, -1.66571044921875, -1.547943115234375, -1.43017578125, -1.312408447265625, -1.19464111328125, -1.076873779296875, -0.9591064453125, -0.841339111328125, -0.72357177734375, -0.605804443359375, -0.488037109375, -0.370269775390625, -0.25250244140625, -0.134735107421875, -0.0169677734375, 0.100799560546875, 0.21856689453125, 0.336334228515625, 0.4541015625, 0.571868896484375, 0.68963623046875, 0.807403564453125, 0.9251708984375, 1.042938232421875, 1.16070556640625, 1.278472900390625, 1.396240234375, 1.514007568359375, 1.63177490234375, 1.749542236328125, 1.8673095703125, 1.985076904296875, 2.10284423828125, 2.220611572265625, 2.33837890625, 2.456146240234375, 2.57391357421875, 2.691680908203125, 2.8094482421875, 2.927215576171875, 3.04498291015625, 3.162750244140625, 3.280517578125, 3.398284912109375, 3.51605224609375, 3.633819580078125, 3.7515869140625, 3.869354248046875, 3.98712158203125, 4.104888916015625, 4.22265625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 4.0, 11.0, 14.0, 23.0, 35.0, 60.0, 68.0, 78.0, 57.0, 31.0, 35.0, 16.0, 13.0, 5.0, 5.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.380627632141113, -13.786942481994629, -13.193258285522461, -12.599573135375977, -12.005888938903809, -11.412203788757324, -10.818519592285156, -10.224834442138672, -9.631149291992188, -9.037464141845703, -8.443779945373535, -7.850094795227051, -7.256410598754883, -6.662725448608398, -6.069040775299072, -5.475356101989746, -4.881671905517578, -4.287987232208252, -3.694302558898926, -3.1006176471710205, -2.5069329738616943, -1.9132483005523682, -1.319563388824463, -0.7258787155151367, -0.13219404220581055, 0.4614906907081604, 1.0551754236221313, 1.648860216140747, 2.2425448894500732, 2.8362295627593994, 3.4299144744873047, 4.023599147796631, 4.617284774780273, 5.2109694480896, 5.804654121398926, 6.39833927154541, 6.992023468017578, 7.5857086181640625, 8.179393768310547, 8.773077964782715, 9.366762161254883, 9.960447311401367, 10.554131507873535, 11.14781665802002, 11.741500854492188, 12.335186004638672, 12.928871154785156, 13.522555351257324, 14.116240501403809, 14.709925651550293, 15.303609848022461, 15.897294998168945, 16.49098014831543, 17.08466339111328, 17.678348541259766, 18.27203369140625, 18.865718841552734, 19.45940399169922, 20.053089141845703, 20.646772384643555, 21.24045753479004, 21.834142684936523, 22.427827835083008, 23.02151107788086, 23.615196228027344]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 10.0, 22.0, 70.0, 110.0, 109.0, 49.0, 25.0, 14.0, 5.0, 9.0, 3.0, 5.0, 8.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.935245513916016, -16.340185165405273, -15.745122909545898, -15.150062561035156, -14.555001258850098, -13.959939956665039, -13.364879608154297, -12.769818305969238, -12.17475700378418, -11.579695701599121, -10.984634399414062, -10.38957405090332, -9.794512748718262, -9.199451446533203, -8.604391098022461, -8.009329795837402, -7.414268493652344, -6.819207191467285, -6.224146366119385, -5.629085540771484, -5.034024238586426, -4.438962936401367, -3.843902111053467, -3.2488412857055664, -2.653779983520508, -2.0587189197540283, -1.4636578559875488, -0.8685967922210693, -0.27353572845458984, 0.32152533531188965, 0.9165863990783691, 1.5116472244262695, 2.106710433959961, 2.7017714977264404, 3.29683256149292, 3.8918936252593994, 4.486954689025879, 5.0820159912109375, 5.677076816558838, 6.272137641906738, 6.867198944091797, 7.4622602462768555, 8.057321548461914, 8.652381896972656, 9.247443199157715, 9.842504501342773, 10.437564849853516, 11.032626152038574, 11.627687454223633, 12.222748756408691, 12.81781005859375, 13.412870407104492, 14.00793170928955, 14.60299301147461, 15.198053359985352, 15.79311466217041, 16.38817596435547, 16.98323631286621, 17.578298568725586, 18.173358917236328, 18.768421173095703, 19.363481521606445, 19.958541870117188, 20.553604125976562, 21.148664474487305]}, "_wandb": {"runtime": 4105}}